1 /*
2  *	IPv6 Address [auto]configuration
3  *	Linux INET6 implementation
4  *
5  *	Authors:
6  *	Pedro Roque		<roque@di.fc.ul.pt>
7  *	Alexey Kuznetsov	<kuznet@ms2.inr.ac.ru>
8  *
9  *	This program is free software; you can redistribute it and/or
10  *      modify it under the terms of the GNU General Public License
11  *      as published by the Free Software Foundation; either version
12  *      2 of the License, or (at your option) any later version.
13  */
14 
15 /*
16  *	Changes:
17  *
18  *	Janos Farkas			:	delete timer on ifdown
19  *	<chexum@bankinf.banki.hu>
20  *	Andi Kleen			:	kill double kfree on module
21  *						unload.
22  *	Maciej W. Rozycki		:	FDDI support
23  *	sekiya@USAGI			:	Don't send too many RS
24  *						packets.
25  *	yoshfuji@USAGI			:       Fixed interval between DAD
26  *						packets.
27  *	YOSHIFUJI Hideaki @USAGI	:	improved accuracy of
28  *						address validation timer.
29  *	YOSHIFUJI Hideaki @USAGI	:	Privacy Extensions (RFC3041)
30  *						support.
31  *	Yuji SEKIYA @USAGI		:	Don't assign a same IPv6
32  *						address on a same interface.
33  *	YOSHIFUJI Hideaki @USAGI	:	ARCnet support
34  *	YOSHIFUJI Hideaki @USAGI	:	convert /proc/net/if_inet6 to
35  *						seq_file.
36  *	YOSHIFUJI Hideaki @USAGI	:	improved source address
37  *						selection; consider scope,
38  *						status etc.
39  */
40 
41 #include <linux/errno.h>
42 #include <linux/types.h>
43 #include <linux/kernel.h>
44 #include <linux/socket.h>
45 #include <linux/sockios.h>
46 #include <linux/net.h>
47 #include <linux/in6.h>
48 #include <linux/netdevice.h>
49 #include <linux/if_addr.h>
50 #include <linux/if_arp.h>
51 #include <linux/if_arcnet.h>
52 #include <linux/if_infiniband.h>
53 #include <linux/route.h>
54 #include <linux/inetdevice.h>
55 #include <linux/init.h>
56 #include <linux/slab.h>
57 #ifdef CONFIG_SYSCTL
58 #include <linux/sysctl.h>
59 #endif
60 #include <linux/capability.h>
61 #include <linux/delay.h>
62 #include <linux/notifier.h>
63 #include <linux/string.h>
64 
65 #include <net/net_namespace.h>
66 #include <net/sock.h>
67 #include <net/snmp.h>
68 
69 #include <net/ipv6.h>
70 #include <net/protocol.h>
71 #include <net/ndisc.h>
72 #include <net/ip6_route.h>
73 #include <net/addrconf.h>
74 #include <net/tcp.h>
75 #include <net/ip.h>
76 #include <net/netlink.h>
77 #include <net/pkt_sched.h>
78 #include <linux/if_tunnel.h>
79 #include <linux/rtnetlink.h>
80 
81 #ifdef CONFIG_IPV6_PRIVACY
82 #include <linux/random.h>
83 #endif
84 
85 #include <linux/uaccess.h>
86 #include <asm/unaligned.h>
87 
88 #include <linux/proc_fs.h>
89 #include <linux/seq_file.h>
90 #include <linux/export.h>
91 
92 /* Set to 3 to get tracing... */
93 #define ACONF_DEBUG 2
94 
95 #if ACONF_DEBUG >= 3
96 #define ADBG(x) printk x
97 #else
98 #define ADBG(x)
99 #endif
100 
101 #define	INFINITY_LIFE_TIME	0xFFFFFFFF
102 
cstamp_delta(unsigned long cstamp)103 static inline u32 cstamp_delta(unsigned long cstamp)
104 {
105 	return (cstamp - INITIAL_JIFFIES) * 100UL / HZ;
106 }
107 
108 #define ADDRCONF_TIMER_FUZZ_MINUS	(HZ > 50 ? HZ/50 : 1)
109 #define ADDRCONF_TIMER_FUZZ		(HZ / 4)
110 #define ADDRCONF_TIMER_FUZZ_MAX		(HZ)
111 
112 #ifdef CONFIG_SYSCTL
113 static void addrconf_sysctl_register(struct inet6_dev *idev);
114 static void addrconf_sysctl_unregister(struct inet6_dev *idev);
115 #else
addrconf_sysctl_register(struct inet6_dev * idev)116 static inline void addrconf_sysctl_register(struct inet6_dev *idev)
117 {
118 }
119 
addrconf_sysctl_unregister(struct inet6_dev * idev)120 static inline void addrconf_sysctl_unregister(struct inet6_dev *idev)
121 {
122 }
123 #endif
124 
125 #ifdef CONFIG_IPV6_PRIVACY
126 static int __ipv6_regen_rndid(struct inet6_dev *idev);
127 static int __ipv6_try_regen_rndid(struct inet6_dev *idev, struct in6_addr *tmpaddr);
128 static void ipv6_regen_rndid(unsigned long data);
129 #endif
130 
131 static int ipv6_generate_eui64(u8 *eui, struct net_device *dev);
132 static int ipv6_count_addresses(struct inet6_dev *idev);
133 
134 /*
135  *	Configured unicast address hash table
136  */
137 static struct hlist_head inet6_addr_lst[IN6_ADDR_HSIZE];
138 static DEFINE_SPINLOCK(addrconf_hash_lock);
139 
140 static void addrconf_verify(unsigned long);
141 
142 static DEFINE_TIMER(addr_chk_timer, addrconf_verify, 0, 0);
143 static DEFINE_SPINLOCK(addrconf_verify_lock);
144 
145 static void addrconf_join_anycast(struct inet6_ifaddr *ifp);
146 static void addrconf_leave_anycast(struct inet6_ifaddr *ifp);
147 
148 static void addrconf_type_change(struct net_device *dev,
149 				 unsigned long event);
150 static int addrconf_ifdown(struct net_device *dev, int how);
151 
152 static void addrconf_dad_start(struct inet6_ifaddr *ifp, u32 flags);
153 static void addrconf_dad_timer(unsigned long data);
154 static void addrconf_dad_completed(struct inet6_ifaddr *ifp);
155 static void addrconf_dad_run(struct inet6_dev *idev);
156 static void addrconf_rs_timer(unsigned long data);
157 static void __ipv6_ifa_notify(int event, struct inet6_ifaddr *ifa);
158 static void ipv6_ifa_notify(int event, struct inet6_ifaddr *ifa);
159 
160 static void inet6_prefix_notify(int event, struct inet6_dev *idev,
161 				struct prefix_info *pinfo);
162 static bool ipv6_chk_same_addr(struct net *net, const struct in6_addr *addr,
163 			       struct net_device *dev);
164 
165 static ATOMIC_NOTIFIER_HEAD(inet6addr_chain);
166 
167 static struct ipv6_devconf ipv6_devconf __read_mostly = {
168 	.forwarding		= 0,
169 	.hop_limit		= IPV6_DEFAULT_HOPLIMIT,
170 	.mtu6			= IPV6_MIN_MTU,
171 	.accept_ra		= 1,
172 	.accept_redirects	= 1,
173 	.autoconf		= 1,
174 	.force_mld_version	= 0,
175 	.dad_transmits		= 1,
176 	.rtr_solicits		= MAX_RTR_SOLICITATIONS,
177 	.rtr_solicit_interval	= RTR_SOLICITATION_INTERVAL,
178 	.rtr_solicit_delay	= MAX_RTR_SOLICITATION_DELAY,
179 #ifdef CONFIG_IPV6_PRIVACY
180 	.use_tempaddr 		= 0,
181 	.temp_valid_lft		= TEMP_VALID_LIFETIME,
182 	.temp_prefered_lft	= TEMP_PREFERRED_LIFETIME,
183 	.regen_max_retry	= REGEN_MAX_RETRY,
184 	.max_desync_factor	= MAX_DESYNC_FACTOR,
185 #endif
186 	.max_addresses		= IPV6_MAX_ADDRESSES,
187 	.accept_ra_defrtr	= 1,
188 	.accept_ra_pinfo	= 1,
189 #ifdef CONFIG_IPV6_ROUTER_PREF
190 	.accept_ra_rtr_pref	= 1,
191 	.rtr_probe_interval	= 60 * HZ,
192 #ifdef CONFIG_IPV6_ROUTE_INFO
193 	.accept_ra_rt_info_max_plen = 0,
194 #endif
195 #endif
196 	.proxy_ndp		= 0,
197 	.accept_source_route	= 0,	/* we do not accept RH0 by default. */
198 	.disable_ipv6		= 0,
199 	.accept_dad		= 1,
200 };
201 
202 static struct ipv6_devconf ipv6_devconf_dflt __read_mostly = {
203 	.forwarding		= 0,
204 	.hop_limit		= IPV6_DEFAULT_HOPLIMIT,
205 	.mtu6			= IPV6_MIN_MTU,
206 	.accept_ra		= 1,
207 	.accept_redirects	= 1,
208 	.autoconf		= 1,
209 	.dad_transmits		= 1,
210 	.rtr_solicits		= MAX_RTR_SOLICITATIONS,
211 	.rtr_solicit_interval	= RTR_SOLICITATION_INTERVAL,
212 	.rtr_solicit_delay	= MAX_RTR_SOLICITATION_DELAY,
213 #ifdef CONFIG_IPV6_PRIVACY
214 	.use_tempaddr		= 0,
215 	.temp_valid_lft		= TEMP_VALID_LIFETIME,
216 	.temp_prefered_lft	= TEMP_PREFERRED_LIFETIME,
217 	.regen_max_retry	= REGEN_MAX_RETRY,
218 	.max_desync_factor	= MAX_DESYNC_FACTOR,
219 #endif
220 	.max_addresses		= IPV6_MAX_ADDRESSES,
221 	.accept_ra_defrtr	= 1,
222 	.accept_ra_pinfo	= 1,
223 #ifdef CONFIG_IPV6_ROUTER_PREF
224 	.accept_ra_rtr_pref	= 1,
225 	.rtr_probe_interval	= 60 * HZ,
226 #ifdef CONFIG_IPV6_ROUTE_INFO
227 	.accept_ra_rt_info_max_plen = 0,
228 #endif
229 #endif
230 	.proxy_ndp		= 0,
231 	.accept_source_route	= 0,	/* we do not accept RH0 by default. */
232 	.disable_ipv6		= 0,
233 	.accept_dad		= 1,
234 };
235 
236 /* IPv6 Wildcard Address and Loopback Address defined by RFC2553 */
237 const struct in6_addr in6addr_any = IN6ADDR_ANY_INIT;
238 const struct in6_addr in6addr_loopback = IN6ADDR_LOOPBACK_INIT;
239 const struct in6_addr in6addr_linklocal_allnodes = IN6ADDR_LINKLOCAL_ALLNODES_INIT;
240 const struct in6_addr in6addr_linklocal_allrouters = IN6ADDR_LINKLOCAL_ALLROUTERS_INIT;
241 
242 /* Check if a valid qdisc is available */
addrconf_qdisc_ok(const struct net_device * dev)243 static inline bool addrconf_qdisc_ok(const struct net_device *dev)
244 {
245 	return !qdisc_tx_is_noop(dev);
246 }
247 
248 /* Check if a route is valid prefix route */
addrconf_is_prefix_route(const struct rt6_info * rt)249 static inline int addrconf_is_prefix_route(const struct rt6_info *rt)
250 {
251 	return (rt->rt6i_flags & (RTF_GATEWAY | RTF_DEFAULT)) == 0;
252 }
253 
addrconf_del_timer(struct inet6_ifaddr * ifp)254 static void addrconf_del_timer(struct inet6_ifaddr *ifp)
255 {
256 	if (del_timer(&ifp->timer))
257 		__in6_ifa_put(ifp);
258 }
259 
260 enum addrconf_timer_t {
261 	AC_NONE,
262 	AC_DAD,
263 	AC_RS,
264 };
265 
addrconf_mod_timer(struct inet6_ifaddr * ifp,enum addrconf_timer_t what,unsigned long when)266 static void addrconf_mod_timer(struct inet6_ifaddr *ifp,
267 			       enum addrconf_timer_t what,
268 			       unsigned long when)
269 {
270 	if (!del_timer(&ifp->timer))
271 		in6_ifa_hold(ifp);
272 
273 	switch (what) {
274 	case AC_DAD:
275 		ifp->timer.function = addrconf_dad_timer;
276 		break;
277 	case AC_RS:
278 		ifp->timer.function = addrconf_rs_timer;
279 		break;
280 	default:
281 		break;
282 	}
283 	ifp->timer.expires = jiffies + when;
284 	add_timer(&ifp->timer);
285 }
286 
snmp6_alloc_dev(struct inet6_dev * idev)287 static int snmp6_alloc_dev(struct inet6_dev *idev)
288 {
289 	if (snmp_mib_init((void __percpu **)idev->stats.ipv6,
290 			  sizeof(struct ipstats_mib),
291 			  __alignof__(struct ipstats_mib)) < 0)
292 		goto err_ip;
293 	idev->stats.icmpv6dev = kzalloc(sizeof(struct icmpv6_mib_device),
294 					GFP_KERNEL);
295 	if (!idev->stats.icmpv6dev)
296 		goto err_icmp;
297 	idev->stats.icmpv6msgdev = kzalloc(sizeof(struct icmpv6msg_mib_device),
298 					   GFP_KERNEL);
299 	if (!idev->stats.icmpv6msgdev)
300 		goto err_icmpmsg;
301 
302 	return 0;
303 
304 err_icmpmsg:
305 	kfree(idev->stats.icmpv6dev);
306 err_icmp:
307 	snmp_mib_free((void __percpu **)idev->stats.ipv6);
308 err_ip:
309 	return -ENOMEM;
310 }
311 
snmp6_free_dev(struct inet6_dev * idev)312 static void snmp6_free_dev(struct inet6_dev *idev)
313 {
314 	kfree(idev->stats.icmpv6msgdev);
315 	kfree(idev->stats.icmpv6dev);
316 	snmp_mib_free((void __percpu **)idev->stats.ipv6);
317 }
318 
319 /* Nobody refers to this device, we may destroy it. */
320 
in6_dev_finish_destroy(struct inet6_dev * idev)321 void in6_dev_finish_destroy(struct inet6_dev *idev)
322 {
323 	struct net_device *dev = idev->dev;
324 
325 	WARN_ON(!list_empty(&idev->addr_list));
326 	WARN_ON(idev->mc_list != NULL);
327 
328 #ifdef NET_REFCNT_DEBUG
329 	printk(KERN_DEBUG "in6_dev_finish_destroy: %s\n", dev ? dev->name : "NIL");
330 #endif
331 	dev_put(dev);
332 	if (!idev->dead) {
333 		pr_warning("Freeing alive inet6 device %p\n", idev);
334 		return;
335 	}
336 	snmp6_free_dev(idev);
337 	kfree_rcu(idev, rcu);
338 }
339 
340 EXPORT_SYMBOL(in6_dev_finish_destroy);
341 
ipv6_add_dev(struct net_device * dev)342 static struct inet6_dev * ipv6_add_dev(struct net_device *dev)
343 {
344 	struct inet6_dev *ndev;
345 
346 	ASSERT_RTNL();
347 
348 	if (dev->mtu < IPV6_MIN_MTU)
349 		return NULL;
350 
351 	ndev = kzalloc(sizeof(struct inet6_dev), GFP_KERNEL);
352 
353 	if (ndev == NULL)
354 		return NULL;
355 
356 	rwlock_init(&ndev->lock);
357 	ndev->dev = dev;
358 	INIT_LIST_HEAD(&ndev->addr_list);
359 
360 	memcpy(&ndev->cnf, dev_net(dev)->ipv6.devconf_dflt, sizeof(ndev->cnf));
361 	ndev->cnf.mtu6 = dev->mtu;
362 	ndev->cnf.sysctl = NULL;
363 	ndev->nd_parms = neigh_parms_alloc(dev, &nd_tbl);
364 	if (ndev->nd_parms == NULL) {
365 		kfree(ndev);
366 		return NULL;
367 	}
368 	if (ndev->cnf.forwarding)
369 		dev_disable_lro(dev);
370 	/* We refer to the device */
371 	dev_hold(dev);
372 
373 	if (snmp6_alloc_dev(ndev) < 0) {
374 		ADBG((KERN_WARNING
375 			"%s(): cannot allocate memory for statistics; dev=%s.\n",
376 			__func__, dev->name));
377 		neigh_parms_release(&nd_tbl, ndev->nd_parms);
378 		dev_put(dev);
379 		kfree(ndev);
380 		return NULL;
381 	}
382 
383 	if (snmp6_register_dev(ndev) < 0) {
384 		ADBG((KERN_WARNING
385 			"%s(): cannot create /proc/net/dev_snmp6/%s\n",
386 			__func__, dev->name));
387 		neigh_parms_release(&nd_tbl, ndev->nd_parms);
388 		ndev->dead = 1;
389 		in6_dev_finish_destroy(ndev);
390 		return NULL;
391 	}
392 
393 	/* One reference from device.  We must do this before
394 	 * we invoke __ipv6_regen_rndid().
395 	 */
396 	in6_dev_hold(ndev);
397 
398 	if (dev->flags & (IFF_NOARP | IFF_LOOPBACK))
399 		ndev->cnf.accept_dad = -1;
400 
401 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE)
402 	if (dev->type == ARPHRD_SIT && (dev->priv_flags & IFF_ISATAP)) {
403 		printk(KERN_INFO
404 		       "%s: Disabled Multicast RS\n",
405 		       dev->name);
406 		ndev->cnf.rtr_solicits = 0;
407 	}
408 #endif
409 
410 #ifdef CONFIG_IPV6_PRIVACY
411 	INIT_LIST_HEAD(&ndev->tempaddr_list);
412 	setup_timer(&ndev->regen_timer, ipv6_regen_rndid, (unsigned long)ndev);
413 	if ((dev->flags&IFF_LOOPBACK) ||
414 	    dev->type == ARPHRD_TUNNEL ||
415 	    dev->type == ARPHRD_TUNNEL6 ||
416 	    dev->type == ARPHRD_SIT ||
417 	    dev->type == ARPHRD_NONE) {
418 		ndev->cnf.use_tempaddr = -1;
419 	} else {
420 		in6_dev_hold(ndev);
421 		ipv6_regen_rndid((unsigned long) ndev);
422 	}
423 #endif
424 
425 	if (netif_running(dev) && addrconf_qdisc_ok(dev))
426 		ndev->if_flags |= IF_READY;
427 
428 	ipv6_mc_init_dev(ndev);
429 	ndev->tstamp = jiffies;
430 	addrconf_sysctl_register(ndev);
431 	/* protected by rtnl_lock */
432 	rcu_assign_pointer(dev->ip6_ptr, ndev);
433 
434 	/* Join all-node multicast group */
435 	ipv6_dev_mc_inc(dev, &in6addr_linklocal_allnodes);
436 
437 	/* Join all-router multicast group if forwarding is set */
438 	if (ndev->cnf.forwarding && (dev->flags & IFF_MULTICAST))
439 		ipv6_dev_mc_inc(dev, &in6addr_linklocal_allrouters);
440 
441 	return ndev;
442 }
443 
ipv6_find_idev(struct net_device * dev)444 static struct inet6_dev * ipv6_find_idev(struct net_device *dev)
445 {
446 	struct inet6_dev *idev;
447 
448 	ASSERT_RTNL();
449 
450 	idev = __in6_dev_get(dev);
451 	if (!idev) {
452 		idev = ipv6_add_dev(dev);
453 		if (!idev)
454 			return NULL;
455 	}
456 
457 	if (dev->flags&IFF_UP)
458 		ipv6_mc_up(idev);
459 	return idev;
460 }
461 
462 #ifdef CONFIG_SYSCTL
dev_forward_change(struct inet6_dev * idev)463 static void dev_forward_change(struct inet6_dev *idev)
464 {
465 	struct net_device *dev;
466 	struct inet6_ifaddr *ifa;
467 
468 	if (!idev)
469 		return;
470 	dev = idev->dev;
471 	if (idev->cnf.forwarding)
472 		dev_disable_lro(dev);
473 	if (dev && (dev->flags & IFF_MULTICAST)) {
474 		if (idev->cnf.forwarding)
475 			ipv6_dev_mc_inc(dev, &in6addr_linklocal_allrouters);
476 		else
477 			ipv6_dev_mc_dec(dev, &in6addr_linklocal_allrouters);
478 	}
479 
480 	list_for_each_entry(ifa, &idev->addr_list, if_list) {
481 		if (ifa->flags&IFA_F_TENTATIVE)
482 			continue;
483 		if (idev->cnf.forwarding)
484 			addrconf_join_anycast(ifa);
485 		else
486 			addrconf_leave_anycast(ifa);
487 	}
488 }
489 
490 
addrconf_forward_change(struct net * net,__s32 newf)491 static void addrconf_forward_change(struct net *net, __s32 newf)
492 {
493 	struct net_device *dev;
494 	struct inet6_dev *idev;
495 
496 	for_each_netdev(net, dev) {
497 		idev = __in6_dev_get(dev);
498 		if (idev) {
499 			int changed = (!idev->cnf.forwarding) ^ (!newf);
500 			idev->cnf.forwarding = newf;
501 			if (changed)
502 				dev_forward_change(idev);
503 		}
504 	}
505 }
506 
addrconf_fixup_forwarding(struct ctl_table * table,int * p,int newf)507 static int addrconf_fixup_forwarding(struct ctl_table *table, int *p, int newf)
508 {
509 	struct net *net;
510 	int old;
511 
512 	if (!rtnl_trylock())
513 		return restart_syscall();
514 
515 	net = (struct net *)table->extra2;
516 	old = *p;
517 	*p = newf;
518 
519 	if (p == &net->ipv6.devconf_dflt->forwarding) {
520 		rtnl_unlock();
521 		return 0;
522 	}
523 
524 	if (p == &net->ipv6.devconf_all->forwarding) {
525 		net->ipv6.devconf_dflt->forwarding = newf;
526 		addrconf_forward_change(net, newf);
527 	} else if ((!newf) ^ (!old))
528 		dev_forward_change((struct inet6_dev *)table->extra1);
529 	rtnl_unlock();
530 
531 	if (newf)
532 		rt6_purge_dflt_routers(net);
533 	return 1;
534 }
535 #endif
536 
537 /* Nobody refers to this ifaddr, destroy it */
inet6_ifa_finish_destroy(struct inet6_ifaddr * ifp)538 void inet6_ifa_finish_destroy(struct inet6_ifaddr *ifp)
539 {
540 	WARN_ON(!hlist_unhashed(&ifp->addr_lst));
541 
542 #ifdef NET_REFCNT_DEBUG
543 	printk(KERN_DEBUG "inet6_ifa_finish_destroy\n");
544 #endif
545 
546 	in6_dev_put(ifp->idev);
547 
548 	if (del_timer(&ifp->timer))
549 		pr_notice("Timer is still running, when freeing ifa=%p\n", ifp);
550 
551 	if (ifp->state != INET6_IFADDR_STATE_DEAD) {
552 		pr_warning("Freeing alive inet6 address %p\n", ifp);
553 		return;
554 	}
555 	dst_release(&ifp->rt->dst);
556 
557 	kfree_rcu(ifp, rcu);
558 }
559 
560 static void
ipv6_link_dev_addr(struct inet6_dev * idev,struct inet6_ifaddr * ifp)561 ipv6_link_dev_addr(struct inet6_dev *idev, struct inet6_ifaddr *ifp)
562 {
563 	struct list_head *p;
564 	int ifp_scope = ipv6_addr_src_scope(&ifp->addr);
565 
566 	/*
567 	 * Each device address list is sorted in order of scope -
568 	 * global before linklocal.
569 	 */
570 	list_for_each(p, &idev->addr_list) {
571 		struct inet6_ifaddr *ifa
572 			= list_entry(p, struct inet6_ifaddr, if_list);
573 		if (ifp_scope >= ipv6_addr_src_scope(&ifa->addr))
574 			break;
575 	}
576 
577 	list_add_tail(&ifp->if_list, p);
578 }
579 
ipv6_addr_hash(const struct in6_addr * addr)580 static u32 ipv6_addr_hash(const struct in6_addr *addr)
581 {
582 	/*
583 	 * We perform the hash function over the last 64 bits of the address
584 	 * This will include the IEEE address token on links that support it.
585 	 */
586 	return jhash_2words((__force u32)addr->s6_addr32[2],
587 			    (__force u32)addr->s6_addr32[3], 0)
588 		& (IN6_ADDR_HSIZE - 1);
589 }
590 
591 /* On success it returns ifp with increased reference count */
592 
593 static struct inet6_ifaddr *
ipv6_add_addr(struct inet6_dev * idev,const struct in6_addr * addr,int pfxlen,int scope,u32 flags)594 ipv6_add_addr(struct inet6_dev *idev, const struct in6_addr *addr, int pfxlen,
595 	      int scope, u32 flags)
596 {
597 	struct inet6_ifaddr *ifa = NULL;
598 	struct rt6_info *rt;
599 	unsigned int hash;
600 	int err = 0;
601 	int addr_type = ipv6_addr_type(addr);
602 
603 	if (addr_type == IPV6_ADDR_ANY ||
604 	    addr_type & IPV6_ADDR_MULTICAST ||
605 	    (!(idev->dev->flags & IFF_LOOPBACK) &&
606 	     addr_type & IPV6_ADDR_LOOPBACK))
607 		return ERR_PTR(-EADDRNOTAVAIL);
608 
609 	rcu_read_lock_bh();
610 	if (idev->dead) {
611 		err = -ENODEV;			/*XXX*/
612 		goto out2;
613 	}
614 
615 	if (idev->cnf.disable_ipv6) {
616 		err = -EACCES;
617 		goto out2;
618 	}
619 
620 	spin_lock(&addrconf_hash_lock);
621 
622 	/* Ignore adding duplicate addresses on an interface */
623 	if (ipv6_chk_same_addr(dev_net(idev->dev), addr, idev->dev)) {
624 		ADBG(("ipv6_add_addr: already assigned\n"));
625 		err = -EEXIST;
626 		goto out;
627 	}
628 
629 	ifa = kzalloc(sizeof(struct inet6_ifaddr), GFP_ATOMIC);
630 
631 	if (ifa == NULL) {
632 		ADBG(("ipv6_add_addr: malloc failed\n"));
633 		err = -ENOBUFS;
634 		goto out;
635 	}
636 
637 	rt = addrconf_dst_alloc(idev, addr, false);
638 	if (IS_ERR(rt)) {
639 		err = PTR_ERR(rt);
640 		goto out;
641 	}
642 
643 	ifa->addr = *addr;
644 
645 	spin_lock_init(&ifa->lock);
646 	spin_lock_init(&ifa->state_lock);
647 	init_timer(&ifa->timer);
648 	INIT_HLIST_NODE(&ifa->addr_lst);
649 	ifa->timer.data = (unsigned long) ifa;
650 	ifa->scope = scope;
651 	ifa->prefix_len = pfxlen;
652 	ifa->flags = flags | IFA_F_TENTATIVE;
653 	ifa->cstamp = ifa->tstamp = jiffies;
654 
655 	ifa->rt = rt;
656 
657 	ifa->idev = idev;
658 	in6_dev_hold(idev);
659 	/* For caller */
660 	in6_ifa_hold(ifa);
661 
662 	/* Add to big hash table */
663 	hash = ipv6_addr_hash(addr);
664 
665 	hlist_add_head_rcu(&ifa->addr_lst, &inet6_addr_lst[hash]);
666 	spin_unlock(&addrconf_hash_lock);
667 
668 	write_lock(&idev->lock);
669 	/* Add to inet6_dev unicast addr list. */
670 	ipv6_link_dev_addr(idev, ifa);
671 
672 #ifdef CONFIG_IPV6_PRIVACY
673 	if (ifa->flags&IFA_F_TEMPORARY) {
674 		list_add(&ifa->tmp_list, &idev->tempaddr_list);
675 		in6_ifa_hold(ifa);
676 	}
677 #endif
678 
679 	in6_ifa_hold(ifa);
680 	write_unlock(&idev->lock);
681 out2:
682 	rcu_read_unlock_bh();
683 
684 	if (likely(err == 0))
685 		atomic_notifier_call_chain(&inet6addr_chain, NETDEV_UP, ifa);
686 	else {
687 		kfree(ifa);
688 		ifa = ERR_PTR(err);
689 	}
690 
691 	return ifa;
692 out:
693 	spin_unlock(&addrconf_hash_lock);
694 	goto out2;
695 }
696 
697 /* This function wants to get referenced ifp and releases it before return */
698 
ipv6_del_addr(struct inet6_ifaddr * ifp)699 static void ipv6_del_addr(struct inet6_ifaddr *ifp)
700 {
701 	struct inet6_ifaddr *ifa, *ifn;
702 	struct inet6_dev *idev = ifp->idev;
703 	int state;
704 	int deleted = 0, onlink = 0;
705 	unsigned long expires = jiffies;
706 
707 	spin_lock_bh(&ifp->state_lock);
708 	state = ifp->state;
709 	ifp->state = INET6_IFADDR_STATE_DEAD;
710 	spin_unlock_bh(&ifp->state_lock);
711 
712 	if (state == INET6_IFADDR_STATE_DEAD)
713 		goto out;
714 
715 	spin_lock_bh(&addrconf_hash_lock);
716 	hlist_del_init_rcu(&ifp->addr_lst);
717 	spin_unlock_bh(&addrconf_hash_lock);
718 
719 	write_lock_bh(&idev->lock);
720 #ifdef CONFIG_IPV6_PRIVACY
721 	if (ifp->flags&IFA_F_TEMPORARY) {
722 		list_del(&ifp->tmp_list);
723 		if (ifp->ifpub) {
724 			in6_ifa_put(ifp->ifpub);
725 			ifp->ifpub = NULL;
726 		}
727 		__in6_ifa_put(ifp);
728 	}
729 #endif
730 
731 	list_for_each_entry_safe(ifa, ifn, &idev->addr_list, if_list) {
732 		if (ifa == ifp) {
733 			list_del_init(&ifp->if_list);
734 			__in6_ifa_put(ifp);
735 
736 			if (!(ifp->flags & IFA_F_PERMANENT) || onlink > 0)
737 				break;
738 			deleted = 1;
739 			continue;
740 		} else if (ifp->flags & IFA_F_PERMANENT) {
741 			if (ipv6_prefix_equal(&ifa->addr, &ifp->addr,
742 					      ifp->prefix_len)) {
743 				if (ifa->flags & IFA_F_PERMANENT) {
744 					onlink = 1;
745 					if (deleted)
746 						break;
747 				} else {
748 					unsigned long lifetime;
749 
750 					if (!onlink)
751 						onlink = -1;
752 
753 					spin_lock(&ifa->lock);
754 
755 					lifetime = addrconf_timeout_fixup(ifa->valid_lft, HZ);
756 					/*
757 					 * Note: Because this address is
758 					 * not permanent, lifetime <
759 					 * LONG_MAX / HZ here.
760 					 */
761 					if (time_before(expires,
762 							ifa->tstamp + lifetime * HZ))
763 						expires = ifa->tstamp + lifetime * HZ;
764 					spin_unlock(&ifa->lock);
765 				}
766 			}
767 		}
768 	}
769 	write_unlock_bh(&idev->lock);
770 
771 	addrconf_del_timer(ifp);
772 
773 	ipv6_ifa_notify(RTM_DELADDR, ifp);
774 
775 	atomic_notifier_call_chain(&inet6addr_chain, NETDEV_DOWN, ifp);
776 
777 	/*
778 	 * Purge or update corresponding prefix
779 	 *
780 	 * 1) we don't purge prefix here if address was not permanent.
781 	 *    prefix is managed by its own lifetime.
782 	 * 2) if there're no addresses, delete prefix.
783 	 * 3) if there're still other permanent address(es),
784 	 *    corresponding prefix is still permanent.
785 	 * 4) otherwise, update prefix lifetime to the
786 	 *    longest valid lifetime among the corresponding
787 	 *    addresses on the device.
788 	 *    Note: subsequent RA will update lifetime.
789 	 *
790 	 * --yoshfuji
791 	 */
792 	if ((ifp->flags & IFA_F_PERMANENT) && onlink < 1) {
793 		struct in6_addr prefix;
794 		struct rt6_info *rt;
795 		struct net *net = dev_net(ifp->idev->dev);
796 		struct flowi6 fl6 = {};
797 
798 		ipv6_addr_prefix(&prefix, &ifp->addr, ifp->prefix_len);
799 		fl6.flowi6_oif = ifp->idev->dev->ifindex;
800 		fl6.daddr = prefix;
801 		rt = (struct rt6_info *)ip6_route_lookup(net, &fl6,
802 							 RT6_LOOKUP_F_IFACE);
803 
804 		if (rt != net->ipv6.ip6_null_entry &&
805 		    addrconf_is_prefix_route(rt)) {
806 			if (onlink == 0) {
807 				ip6_del_rt(rt);
808 				rt = NULL;
809 			} else if (!(rt->rt6i_flags & RTF_EXPIRES)) {
810 				rt6_set_expires(rt, expires);
811 			}
812 		}
813 		dst_release(&rt->dst);
814 	}
815 
816 	/* clean up prefsrc entries */
817 	rt6_remove_prefsrc(ifp);
818 out:
819 	in6_ifa_put(ifp);
820 }
821 
822 #ifdef CONFIG_IPV6_PRIVACY
ipv6_create_tempaddr(struct inet6_ifaddr * ifp,struct inet6_ifaddr * ift)823 static int ipv6_create_tempaddr(struct inet6_ifaddr *ifp, struct inet6_ifaddr *ift)
824 {
825 	struct inet6_dev *idev = ifp->idev;
826 	struct in6_addr addr, *tmpaddr;
827 	unsigned long tmp_prefered_lft, tmp_valid_lft, tmp_tstamp, age;
828 	unsigned long regen_advance;
829 	int tmp_plen;
830 	int ret = 0;
831 	int max_addresses;
832 	u32 addr_flags;
833 	unsigned long now = jiffies;
834 
835 	write_lock(&idev->lock);
836 	if (ift) {
837 		spin_lock_bh(&ift->lock);
838 		memcpy(&addr.s6_addr[8], &ift->addr.s6_addr[8], 8);
839 		spin_unlock_bh(&ift->lock);
840 		tmpaddr = &addr;
841 	} else {
842 		tmpaddr = NULL;
843 	}
844 retry:
845 	in6_dev_hold(idev);
846 	if (idev->cnf.use_tempaddr <= 0) {
847 		write_unlock(&idev->lock);
848 		printk(KERN_INFO
849 			"ipv6_create_tempaddr(): use_tempaddr is disabled.\n");
850 		in6_dev_put(idev);
851 		ret = -1;
852 		goto out;
853 	}
854 	spin_lock_bh(&ifp->lock);
855 	if (ifp->regen_count++ >= idev->cnf.regen_max_retry) {
856 		idev->cnf.use_tempaddr = -1;	/*XXX*/
857 		spin_unlock_bh(&ifp->lock);
858 		write_unlock(&idev->lock);
859 		printk(KERN_WARNING
860 			"ipv6_create_tempaddr(): regeneration time exceeded. disabled temporary address support.\n");
861 		in6_dev_put(idev);
862 		ret = -1;
863 		goto out;
864 	}
865 	in6_ifa_hold(ifp);
866 	memcpy(addr.s6_addr, ifp->addr.s6_addr, 8);
867 	if (__ipv6_try_regen_rndid(idev, tmpaddr) < 0) {
868 		spin_unlock_bh(&ifp->lock);
869 		write_unlock(&idev->lock);
870 		printk(KERN_WARNING
871 			"ipv6_create_tempaddr(): regeneration of randomized interface id failed.\n");
872 		in6_ifa_put(ifp);
873 		in6_dev_put(idev);
874 		ret = -1;
875 		goto out;
876 	}
877 	memcpy(&addr.s6_addr[8], idev->rndid, 8);
878 	age = (now - ifp->tstamp) / HZ;
879 	tmp_valid_lft = min_t(__u32,
880 			      ifp->valid_lft,
881 			      idev->cnf.temp_valid_lft + age);
882 	tmp_prefered_lft = min_t(__u32,
883 				 ifp->prefered_lft,
884 				 idev->cnf.temp_prefered_lft + age -
885 				 idev->cnf.max_desync_factor);
886 	tmp_plen = ifp->prefix_len;
887 	max_addresses = idev->cnf.max_addresses;
888 	tmp_tstamp = ifp->tstamp;
889 	spin_unlock_bh(&ifp->lock);
890 
891 	regen_advance = idev->cnf.regen_max_retry *
892 	                idev->cnf.dad_transmits *
893 	                idev->nd_parms->retrans_time / HZ;
894 	write_unlock(&idev->lock);
895 
896 	/* A temporary address is created only if this calculated Preferred
897 	 * Lifetime is greater than REGEN_ADVANCE time units.  In particular,
898 	 * an implementation must not create a temporary address with a zero
899 	 * Preferred Lifetime.
900 	 * Use age calculation as in addrconf_verify to avoid unnecessary
901 	 * temporary addresses being generated.
902 	 */
903 	age = (now - tmp_tstamp + ADDRCONF_TIMER_FUZZ_MINUS) / HZ;
904 	if (tmp_prefered_lft <= regen_advance + age) {
905 		in6_ifa_put(ifp);
906 		in6_dev_put(idev);
907 		ret = -1;
908 		goto out;
909 	}
910 
911 	addr_flags = IFA_F_TEMPORARY;
912 	/* set in addrconf_prefix_rcv() */
913 	if (ifp->flags & IFA_F_OPTIMISTIC)
914 		addr_flags |= IFA_F_OPTIMISTIC;
915 
916 	ift = ipv6_add_addr(idev, &addr, tmp_plen,
917 			    ipv6_addr_type(&addr)&IPV6_ADDR_SCOPE_MASK,
918 			    addr_flags);
919 	if (IS_ERR(ift)) {
920 		in6_ifa_put(ifp);
921 		in6_dev_put(idev);
922 		printk(KERN_INFO
923 			"ipv6_create_tempaddr(): retry temporary address regeneration.\n");
924 		tmpaddr = &addr;
925 		write_lock(&idev->lock);
926 		goto retry;
927 	}
928 
929 	spin_lock_bh(&ift->lock);
930 	ift->ifpub = ifp;
931 	ift->valid_lft = tmp_valid_lft;
932 	ift->prefered_lft = tmp_prefered_lft;
933 	ift->cstamp = now;
934 	ift->tstamp = tmp_tstamp;
935 	spin_unlock_bh(&ift->lock);
936 
937 	addrconf_dad_start(ift, 0);
938 	in6_ifa_put(ift);
939 	in6_dev_put(idev);
940 out:
941 	return ret;
942 }
943 #endif
944 
945 /*
946  *	Choose an appropriate source address (RFC3484)
947  */
948 enum {
949 	IPV6_SADDR_RULE_INIT = 0,
950 	IPV6_SADDR_RULE_LOCAL,
951 	IPV6_SADDR_RULE_SCOPE,
952 	IPV6_SADDR_RULE_PREFERRED,
953 #ifdef CONFIG_IPV6_MIP6
954 	IPV6_SADDR_RULE_HOA,
955 #endif
956 	IPV6_SADDR_RULE_OIF,
957 	IPV6_SADDR_RULE_LABEL,
958 #ifdef CONFIG_IPV6_PRIVACY
959 	IPV6_SADDR_RULE_PRIVACY,
960 #endif
961 	IPV6_SADDR_RULE_ORCHID,
962 	IPV6_SADDR_RULE_PREFIX,
963 	IPV6_SADDR_RULE_MAX
964 };
965 
966 struct ipv6_saddr_score {
967 	int			rule;
968 	int			addr_type;
969 	struct inet6_ifaddr	*ifa;
970 	DECLARE_BITMAP(scorebits, IPV6_SADDR_RULE_MAX);
971 	int			scopedist;
972 	int			matchlen;
973 };
974 
975 struct ipv6_saddr_dst {
976 	const struct in6_addr *addr;
977 	int ifindex;
978 	int scope;
979 	int label;
980 	unsigned int prefs;
981 };
982 
ipv6_saddr_preferred(int type)983 static inline int ipv6_saddr_preferred(int type)
984 {
985 	if (type & (IPV6_ADDR_MAPPED|IPV6_ADDR_COMPATv4|IPV6_ADDR_LOOPBACK))
986 		return 1;
987 	return 0;
988 }
989 
ipv6_get_saddr_eval(struct net * net,struct ipv6_saddr_score * score,struct ipv6_saddr_dst * dst,int i)990 static int ipv6_get_saddr_eval(struct net *net,
991 			       struct ipv6_saddr_score *score,
992 			       struct ipv6_saddr_dst *dst,
993 			       int i)
994 {
995 	int ret;
996 
997 	if (i <= score->rule) {
998 		switch (i) {
999 		case IPV6_SADDR_RULE_SCOPE:
1000 			ret = score->scopedist;
1001 			break;
1002 		case IPV6_SADDR_RULE_PREFIX:
1003 			ret = score->matchlen;
1004 			break;
1005 		default:
1006 			ret = !!test_bit(i, score->scorebits);
1007 		}
1008 		goto out;
1009 	}
1010 
1011 	switch (i) {
1012 	case IPV6_SADDR_RULE_INIT:
1013 		/* Rule 0: remember if hiscore is not ready yet */
1014 		ret = !!score->ifa;
1015 		break;
1016 	case IPV6_SADDR_RULE_LOCAL:
1017 		/* Rule 1: Prefer same address */
1018 		ret = ipv6_addr_equal(&score->ifa->addr, dst->addr);
1019 		break;
1020 	case IPV6_SADDR_RULE_SCOPE:
1021 		/* Rule 2: Prefer appropriate scope
1022 		 *
1023 		 *      ret
1024 		 *       ^
1025 		 *    -1 |  d 15
1026 		 *    ---+--+-+---> scope
1027 		 *       |
1028 		 *       |             d is scope of the destination.
1029 		 *  B-d  |  \
1030 		 *       |   \      <- smaller scope is better if
1031 		 *  B-15 |    \        if scope is enough for destinaion.
1032 		 *       |             ret = B - scope (-1 <= scope >= d <= 15).
1033 		 * d-C-1 | /
1034 		 *       |/         <- greater is better
1035 		 *   -C  /             if scope is not enough for destination.
1036 		 *      /|             ret = scope - C (-1 <= d < scope <= 15).
1037 		 *
1038 		 * d - C - 1 < B -15 (for all -1 <= d <= 15).
1039 		 * C > d + 14 - B >= 15 + 14 - B = 29 - B.
1040 		 * Assume B = 0 and we get C > 29.
1041 		 */
1042 		ret = __ipv6_addr_src_scope(score->addr_type);
1043 		if (ret >= dst->scope)
1044 			ret = -ret;
1045 		else
1046 			ret -= 128;	/* 30 is enough */
1047 		score->scopedist = ret;
1048 		break;
1049 	case IPV6_SADDR_RULE_PREFERRED:
1050 		/* Rule 3: Avoid deprecated and optimistic addresses */
1051 		ret = ipv6_saddr_preferred(score->addr_type) ||
1052 		      !(score->ifa->flags & (IFA_F_DEPRECATED|IFA_F_OPTIMISTIC));
1053 		break;
1054 #ifdef CONFIG_IPV6_MIP6
1055 	case IPV6_SADDR_RULE_HOA:
1056 	    {
1057 		/* Rule 4: Prefer home address */
1058 		int prefhome = !(dst->prefs & IPV6_PREFER_SRC_COA);
1059 		ret = !(score->ifa->flags & IFA_F_HOMEADDRESS) ^ prefhome;
1060 		break;
1061 	    }
1062 #endif
1063 	case IPV6_SADDR_RULE_OIF:
1064 		/* Rule 5: Prefer outgoing interface */
1065 		ret = (!dst->ifindex ||
1066 		       dst->ifindex == score->ifa->idev->dev->ifindex);
1067 		break;
1068 	case IPV6_SADDR_RULE_LABEL:
1069 		/* Rule 6: Prefer matching label */
1070 		ret = ipv6_addr_label(net,
1071 				      &score->ifa->addr, score->addr_type,
1072 				      score->ifa->idev->dev->ifindex) == dst->label;
1073 		break;
1074 #ifdef CONFIG_IPV6_PRIVACY
1075 	case IPV6_SADDR_RULE_PRIVACY:
1076 	    {
1077 		/* Rule 7: Prefer public address
1078 		 * Note: prefer temporary address if use_tempaddr >= 2
1079 		 */
1080 		int preftmp = dst->prefs & (IPV6_PREFER_SRC_PUBLIC|IPV6_PREFER_SRC_TMP) ?
1081 				!!(dst->prefs & IPV6_PREFER_SRC_TMP) :
1082 				score->ifa->idev->cnf.use_tempaddr >= 2;
1083 		ret = (!(score->ifa->flags & IFA_F_TEMPORARY)) ^ preftmp;
1084 		break;
1085 	    }
1086 #endif
1087 	case IPV6_SADDR_RULE_ORCHID:
1088 		/* Rule 8-: Prefer ORCHID vs ORCHID or
1089 		 *	    non-ORCHID vs non-ORCHID
1090 		 */
1091 		ret = !(ipv6_addr_orchid(&score->ifa->addr) ^
1092 			ipv6_addr_orchid(dst->addr));
1093 		break;
1094 	case IPV6_SADDR_RULE_PREFIX:
1095 		/* Rule 8: Use longest matching prefix */
1096 		score->matchlen = ret = ipv6_addr_diff(&score->ifa->addr,
1097 						       dst->addr);
1098 		break;
1099 	default:
1100 		ret = 0;
1101 	}
1102 
1103 	if (ret)
1104 		__set_bit(i, score->scorebits);
1105 	score->rule = i;
1106 out:
1107 	return ret;
1108 }
1109 
ipv6_dev_get_saddr(struct net * net,struct net_device * dst_dev,const struct in6_addr * daddr,unsigned int prefs,struct in6_addr * saddr)1110 int ipv6_dev_get_saddr(struct net *net, struct net_device *dst_dev,
1111 		       const struct in6_addr *daddr, unsigned int prefs,
1112 		       struct in6_addr *saddr)
1113 {
1114 	struct ipv6_saddr_score scores[2],
1115 				*score = &scores[0], *hiscore = &scores[1];
1116 	struct ipv6_saddr_dst dst;
1117 	struct net_device *dev;
1118 	int dst_type;
1119 
1120 	dst_type = __ipv6_addr_type(daddr);
1121 	dst.addr = daddr;
1122 	dst.ifindex = dst_dev ? dst_dev->ifindex : 0;
1123 	dst.scope = __ipv6_addr_src_scope(dst_type);
1124 	dst.label = ipv6_addr_label(net, daddr, dst_type, dst.ifindex);
1125 	dst.prefs = prefs;
1126 
1127 	hiscore->rule = -1;
1128 	hiscore->ifa = NULL;
1129 
1130 	rcu_read_lock();
1131 
1132 	for_each_netdev_rcu(net, dev) {
1133 		struct inet6_dev *idev;
1134 
1135 		/* Candidate Source Address (section 4)
1136 		 *  - multicast and link-local destination address,
1137 		 *    the set of candidate source address MUST only
1138 		 *    include addresses assigned to interfaces
1139 		 *    belonging to the same link as the outgoing
1140 		 *    interface.
1141 		 * (- For site-local destination addresses, the
1142 		 *    set of candidate source addresses MUST only
1143 		 *    include addresses assigned to interfaces
1144 		 *    belonging to the same site as the outgoing
1145 		 *    interface.)
1146 		 */
1147 		if (((dst_type & IPV6_ADDR_MULTICAST) ||
1148 		     dst.scope <= IPV6_ADDR_SCOPE_LINKLOCAL) &&
1149 		    dst.ifindex && dev->ifindex != dst.ifindex)
1150 			continue;
1151 
1152 		idev = __in6_dev_get(dev);
1153 		if (!idev)
1154 			continue;
1155 
1156 		read_lock_bh(&idev->lock);
1157 		list_for_each_entry(score->ifa, &idev->addr_list, if_list) {
1158 			int i;
1159 
1160 			/*
1161 			 * - Tentative Address (RFC2462 section 5.4)
1162 			 *  - A tentative address is not considered
1163 			 *    "assigned to an interface" in the traditional
1164 			 *    sense, unless it is also flagged as optimistic.
1165 			 * - Candidate Source Address (section 4)
1166 			 *  - In any case, anycast addresses, multicast
1167 			 *    addresses, and the unspecified address MUST
1168 			 *    NOT be included in a candidate set.
1169 			 */
1170 			if ((score->ifa->flags & IFA_F_TENTATIVE) &&
1171 			    (!(score->ifa->flags & IFA_F_OPTIMISTIC)))
1172 				continue;
1173 
1174 			score->addr_type = __ipv6_addr_type(&score->ifa->addr);
1175 
1176 			if (unlikely(score->addr_type == IPV6_ADDR_ANY ||
1177 				     score->addr_type & IPV6_ADDR_MULTICAST)) {
1178 				LIMIT_NETDEBUG(KERN_DEBUG
1179 					       "ADDRCONF: unspecified / multicast address "
1180 					       "assigned as unicast address on %s",
1181 					       dev->name);
1182 				continue;
1183 			}
1184 
1185 			score->rule = -1;
1186 			bitmap_zero(score->scorebits, IPV6_SADDR_RULE_MAX);
1187 
1188 			for (i = 0; i < IPV6_SADDR_RULE_MAX; i++) {
1189 				int minihiscore, miniscore;
1190 
1191 				minihiscore = ipv6_get_saddr_eval(net, hiscore, &dst, i);
1192 				miniscore = ipv6_get_saddr_eval(net, score, &dst, i);
1193 
1194 				if (minihiscore > miniscore) {
1195 					if (i == IPV6_SADDR_RULE_SCOPE &&
1196 					    score->scopedist > 0) {
1197 						/*
1198 						 * special case:
1199 						 * each remaining entry
1200 						 * has too small (not enough)
1201 						 * scope, because ifa entries
1202 						 * are sorted by their scope
1203 						 * values.
1204 						 */
1205 						goto try_nextdev;
1206 					}
1207 					break;
1208 				} else if (minihiscore < miniscore) {
1209 					if (hiscore->ifa)
1210 						in6_ifa_put(hiscore->ifa);
1211 
1212 					in6_ifa_hold(score->ifa);
1213 
1214 					swap(hiscore, score);
1215 
1216 					/* restore our iterator */
1217 					score->ifa = hiscore->ifa;
1218 
1219 					break;
1220 				}
1221 			}
1222 		}
1223 try_nextdev:
1224 		read_unlock_bh(&idev->lock);
1225 	}
1226 	rcu_read_unlock();
1227 
1228 	if (!hiscore->ifa)
1229 		return -EADDRNOTAVAIL;
1230 
1231 	*saddr = hiscore->ifa->addr;
1232 	in6_ifa_put(hiscore->ifa);
1233 	return 0;
1234 }
1235 EXPORT_SYMBOL(ipv6_dev_get_saddr);
1236 
__ipv6_get_lladdr(struct inet6_dev * idev,struct in6_addr * addr,unsigned char banned_flags)1237 int __ipv6_get_lladdr(struct inet6_dev *idev, struct in6_addr *addr,
1238 		      unsigned char banned_flags)
1239 {
1240 	struct inet6_ifaddr *ifp;
1241 	int err = -EADDRNOTAVAIL;
1242 
1243 	list_for_each_entry(ifp, &idev->addr_list, if_list) {
1244 		if (ifp->scope == IFA_LINK &&
1245 		    !(ifp->flags & banned_flags)) {
1246 			*addr = ifp->addr;
1247 			err = 0;
1248 			break;
1249 		}
1250 	}
1251 	return err;
1252 }
1253 
ipv6_get_lladdr(struct net_device * dev,struct in6_addr * addr,unsigned char banned_flags)1254 int ipv6_get_lladdr(struct net_device *dev, struct in6_addr *addr,
1255 		    unsigned char banned_flags)
1256 {
1257 	struct inet6_dev *idev;
1258 	int err = -EADDRNOTAVAIL;
1259 
1260 	rcu_read_lock();
1261 	idev = __in6_dev_get(dev);
1262 	if (idev) {
1263 		read_lock_bh(&idev->lock);
1264 		err = __ipv6_get_lladdr(idev, addr, banned_flags);
1265 		read_unlock_bh(&idev->lock);
1266 	}
1267 	rcu_read_unlock();
1268 	return err;
1269 }
1270 
ipv6_count_addresses(struct inet6_dev * idev)1271 static int ipv6_count_addresses(struct inet6_dev *idev)
1272 {
1273 	int cnt = 0;
1274 	struct inet6_ifaddr *ifp;
1275 
1276 	read_lock_bh(&idev->lock);
1277 	list_for_each_entry(ifp, &idev->addr_list, if_list)
1278 		cnt++;
1279 	read_unlock_bh(&idev->lock);
1280 	return cnt;
1281 }
1282 
ipv6_chk_addr(struct net * net,const struct in6_addr * addr,struct net_device * dev,int strict)1283 int ipv6_chk_addr(struct net *net, const struct in6_addr *addr,
1284 		  struct net_device *dev, int strict)
1285 {
1286 	struct inet6_ifaddr *ifp;
1287 	struct hlist_node *node;
1288 	unsigned int hash = ipv6_addr_hash(addr);
1289 
1290 	rcu_read_lock_bh();
1291 	hlist_for_each_entry_rcu(ifp, node, &inet6_addr_lst[hash], addr_lst) {
1292 		if (!net_eq(dev_net(ifp->idev->dev), net))
1293 			continue;
1294 		if (ipv6_addr_equal(&ifp->addr, addr) &&
1295 		    !(ifp->flags&IFA_F_TENTATIVE) &&
1296 		    (dev == NULL || ifp->idev->dev == dev ||
1297 		     !(ifp->scope&(IFA_LINK|IFA_HOST) || strict))) {
1298 			rcu_read_unlock_bh();
1299 			return 1;
1300 		}
1301 	}
1302 
1303 	rcu_read_unlock_bh();
1304 	return 0;
1305 }
1306 EXPORT_SYMBOL(ipv6_chk_addr);
1307 
ipv6_chk_same_addr(struct net * net,const struct in6_addr * addr,struct net_device * dev)1308 static bool ipv6_chk_same_addr(struct net *net, const struct in6_addr *addr,
1309 			       struct net_device *dev)
1310 {
1311 	unsigned int hash = ipv6_addr_hash(addr);
1312 	struct inet6_ifaddr *ifp;
1313 	struct hlist_node *node;
1314 
1315 	hlist_for_each_entry(ifp, node, &inet6_addr_lst[hash], addr_lst) {
1316 		if (!net_eq(dev_net(ifp->idev->dev), net))
1317 			continue;
1318 		if (ipv6_addr_equal(&ifp->addr, addr)) {
1319 			if (dev == NULL || ifp->idev->dev == dev)
1320 				return true;
1321 		}
1322 	}
1323 	return false;
1324 }
1325 
ipv6_chk_prefix(const struct in6_addr * addr,struct net_device * dev)1326 int ipv6_chk_prefix(const struct in6_addr *addr, struct net_device *dev)
1327 {
1328 	struct inet6_dev *idev;
1329 	struct inet6_ifaddr *ifa;
1330 	int	onlink;
1331 
1332 	onlink = 0;
1333 	rcu_read_lock();
1334 	idev = __in6_dev_get(dev);
1335 	if (idev) {
1336 		read_lock_bh(&idev->lock);
1337 		list_for_each_entry(ifa, &idev->addr_list, if_list) {
1338 			onlink = ipv6_prefix_equal(addr, &ifa->addr,
1339 						   ifa->prefix_len);
1340 			if (onlink)
1341 				break;
1342 		}
1343 		read_unlock_bh(&idev->lock);
1344 	}
1345 	rcu_read_unlock();
1346 	return onlink;
1347 }
1348 
1349 EXPORT_SYMBOL(ipv6_chk_prefix);
1350 
ipv6_get_ifaddr(struct net * net,const struct in6_addr * addr,struct net_device * dev,int strict)1351 struct inet6_ifaddr *ipv6_get_ifaddr(struct net *net, const struct in6_addr *addr,
1352 				     struct net_device *dev, int strict)
1353 {
1354 	struct inet6_ifaddr *ifp, *result = NULL;
1355 	unsigned int hash = ipv6_addr_hash(addr);
1356 	struct hlist_node *node;
1357 
1358 	rcu_read_lock_bh();
1359 	hlist_for_each_entry_rcu_bh(ifp, node, &inet6_addr_lst[hash], addr_lst) {
1360 		if (!net_eq(dev_net(ifp->idev->dev), net))
1361 			continue;
1362 		if (ipv6_addr_equal(&ifp->addr, addr)) {
1363 			if (dev == NULL || ifp->idev->dev == dev ||
1364 			    !(ifp->scope&(IFA_LINK|IFA_HOST) || strict)) {
1365 				result = ifp;
1366 				in6_ifa_hold(ifp);
1367 				break;
1368 			}
1369 		}
1370 	}
1371 	rcu_read_unlock_bh();
1372 
1373 	return result;
1374 }
1375 
1376 /* Gets referenced address, destroys ifaddr */
1377 
addrconf_dad_stop(struct inet6_ifaddr * ifp,int dad_failed)1378 static void addrconf_dad_stop(struct inet6_ifaddr *ifp, int dad_failed)
1379 {
1380 	if (ifp->flags&IFA_F_PERMANENT) {
1381 		spin_lock_bh(&ifp->lock);
1382 		addrconf_del_timer(ifp);
1383 		ifp->flags |= IFA_F_TENTATIVE;
1384 		if (dad_failed)
1385 			ifp->flags |= IFA_F_DADFAILED;
1386 		spin_unlock_bh(&ifp->lock);
1387 		if (dad_failed)
1388 			ipv6_ifa_notify(0, ifp);
1389 		in6_ifa_put(ifp);
1390 #ifdef CONFIG_IPV6_PRIVACY
1391 	} else if (ifp->flags&IFA_F_TEMPORARY) {
1392 		struct inet6_ifaddr *ifpub;
1393 		spin_lock_bh(&ifp->lock);
1394 		ifpub = ifp->ifpub;
1395 		if (ifpub) {
1396 			in6_ifa_hold(ifpub);
1397 			spin_unlock_bh(&ifp->lock);
1398 			ipv6_create_tempaddr(ifpub, ifp);
1399 			in6_ifa_put(ifpub);
1400 		} else {
1401 			spin_unlock_bh(&ifp->lock);
1402 		}
1403 		ipv6_del_addr(ifp);
1404 #endif
1405 	} else
1406 		ipv6_del_addr(ifp);
1407 }
1408 
addrconf_dad_end(struct inet6_ifaddr * ifp)1409 static int addrconf_dad_end(struct inet6_ifaddr *ifp)
1410 {
1411 	int err = -ENOENT;
1412 
1413 	spin_lock(&ifp->state_lock);
1414 	if (ifp->state == INET6_IFADDR_STATE_DAD) {
1415 		ifp->state = INET6_IFADDR_STATE_POSTDAD;
1416 		err = 0;
1417 	}
1418 	spin_unlock(&ifp->state_lock);
1419 
1420 	return err;
1421 }
1422 
addrconf_dad_failure(struct inet6_ifaddr * ifp)1423 void addrconf_dad_failure(struct inet6_ifaddr *ifp)
1424 {
1425 	struct inet6_dev *idev = ifp->idev;
1426 
1427 	if (addrconf_dad_end(ifp)) {
1428 		in6_ifa_put(ifp);
1429 		return;
1430 	}
1431 
1432 	if (net_ratelimit())
1433 		printk(KERN_INFO "%s: IPv6 duplicate address %pI6c detected!\n",
1434 			ifp->idev->dev->name, &ifp->addr);
1435 
1436 	if (idev->cnf.accept_dad > 1 && !idev->cnf.disable_ipv6) {
1437 		struct in6_addr addr;
1438 
1439 		addr.s6_addr32[0] = htonl(0xfe800000);
1440 		addr.s6_addr32[1] = 0;
1441 
1442 		if (!ipv6_generate_eui64(addr.s6_addr + 8, idev->dev) &&
1443 		    ipv6_addr_equal(&ifp->addr, &addr)) {
1444 			/* DAD failed for link-local based on MAC address */
1445 			idev->cnf.disable_ipv6 = 1;
1446 
1447 			printk(KERN_INFO "%s: IPv6 being disabled!\n",
1448 				ifp->idev->dev->name);
1449 		}
1450 	}
1451 
1452 	addrconf_dad_stop(ifp, 1);
1453 }
1454 
1455 /* Join to solicited addr multicast group. */
1456 
addrconf_join_solict(struct net_device * dev,const struct in6_addr * addr)1457 void addrconf_join_solict(struct net_device *dev, const struct in6_addr *addr)
1458 {
1459 	struct in6_addr maddr;
1460 
1461 	if (dev->flags&(IFF_LOOPBACK|IFF_NOARP))
1462 		return;
1463 
1464 	addrconf_addr_solict_mult(addr, &maddr);
1465 	ipv6_dev_mc_inc(dev, &maddr);
1466 }
1467 
addrconf_leave_solict(struct inet6_dev * idev,const struct in6_addr * addr)1468 void addrconf_leave_solict(struct inet6_dev *idev, const struct in6_addr *addr)
1469 {
1470 	struct in6_addr maddr;
1471 
1472 	if (idev->dev->flags&(IFF_LOOPBACK|IFF_NOARP))
1473 		return;
1474 
1475 	addrconf_addr_solict_mult(addr, &maddr);
1476 	__ipv6_dev_mc_dec(idev, &maddr);
1477 }
1478 
addrconf_join_anycast(struct inet6_ifaddr * ifp)1479 static void addrconf_join_anycast(struct inet6_ifaddr *ifp)
1480 {
1481 	struct in6_addr addr;
1482 	if (ifp->prefix_len == 127) /* RFC 6164 */
1483 		return;
1484 	ipv6_addr_prefix(&addr, &ifp->addr, ifp->prefix_len);
1485 	if (ipv6_addr_any(&addr))
1486 		return;
1487 	ipv6_dev_ac_inc(ifp->idev->dev, &addr);
1488 }
1489 
addrconf_leave_anycast(struct inet6_ifaddr * ifp)1490 static void addrconf_leave_anycast(struct inet6_ifaddr *ifp)
1491 {
1492 	struct in6_addr addr;
1493 	if (ifp->prefix_len == 127) /* RFC 6164 */
1494 		return;
1495 	ipv6_addr_prefix(&addr, &ifp->addr, ifp->prefix_len);
1496 	if (ipv6_addr_any(&addr))
1497 		return;
1498 	__ipv6_dev_ac_dec(ifp->idev, &addr);
1499 }
1500 
addrconf_ifid_eui48(u8 * eui,struct net_device * dev)1501 static int addrconf_ifid_eui48(u8 *eui, struct net_device *dev)
1502 {
1503 	if (dev->addr_len != ETH_ALEN)
1504 		return -1;
1505 	memcpy(eui, dev->dev_addr, 3);
1506 	memcpy(eui + 5, dev->dev_addr + 3, 3);
1507 
1508 	/*
1509 	 * The zSeries OSA network cards can be shared among various
1510 	 * OS instances, but the OSA cards have only one MAC address.
1511 	 * This leads to duplicate address conflicts in conjunction
1512 	 * with IPv6 if more than one instance uses the same card.
1513 	 *
1514 	 * The driver for these cards can deliver a unique 16-bit
1515 	 * identifier for each instance sharing the same card.  It is
1516 	 * placed instead of 0xFFFE in the interface identifier.  The
1517 	 * "u" bit of the interface identifier is not inverted in this
1518 	 * case.  Hence the resulting interface identifier has local
1519 	 * scope according to RFC2373.
1520 	 */
1521 	if (dev->dev_id) {
1522 		eui[3] = (dev->dev_id >> 8) & 0xFF;
1523 		eui[4] = dev->dev_id & 0xFF;
1524 	} else {
1525 		eui[3] = 0xFF;
1526 		eui[4] = 0xFE;
1527 		eui[0] ^= 2;
1528 	}
1529 	return 0;
1530 }
1531 
addrconf_ifid_arcnet(u8 * eui,struct net_device * dev)1532 static int addrconf_ifid_arcnet(u8 *eui, struct net_device *dev)
1533 {
1534 	/* XXX: inherit EUI-64 from other interface -- yoshfuji */
1535 	if (dev->addr_len != ARCNET_ALEN)
1536 		return -1;
1537 	memset(eui, 0, 7);
1538 	eui[7] = *(u8*)dev->dev_addr;
1539 	return 0;
1540 }
1541 
addrconf_ifid_infiniband(u8 * eui,struct net_device * dev)1542 static int addrconf_ifid_infiniband(u8 *eui, struct net_device *dev)
1543 {
1544 	if (dev->addr_len != INFINIBAND_ALEN)
1545 		return -1;
1546 	memcpy(eui, dev->dev_addr + 12, 8);
1547 	eui[0] |= 2;
1548 	return 0;
1549 }
1550 
__ipv6_isatap_ifid(u8 * eui,__be32 addr)1551 static int __ipv6_isatap_ifid(u8 *eui, __be32 addr)
1552 {
1553 	if (addr == 0)
1554 		return -1;
1555 	eui[0] = (ipv4_is_zeronet(addr) || ipv4_is_private_10(addr) ||
1556 		  ipv4_is_loopback(addr) || ipv4_is_linklocal_169(addr) ||
1557 		  ipv4_is_private_172(addr) || ipv4_is_test_192(addr) ||
1558 		  ipv4_is_anycast_6to4(addr) || ipv4_is_private_192(addr) ||
1559 		  ipv4_is_test_198(addr) || ipv4_is_multicast(addr) ||
1560 		  ipv4_is_lbcast(addr)) ? 0x00 : 0x02;
1561 	eui[1] = 0;
1562 	eui[2] = 0x5E;
1563 	eui[3] = 0xFE;
1564 	memcpy(eui + 4, &addr, 4);
1565 	return 0;
1566 }
1567 
addrconf_ifid_sit(u8 * eui,struct net_device * dev)1568 static int addrconf_ifid_sit(u8 *eui, struct net_device *dev)
1569 {
1570 	if (dev->priv_flags & IFF_ISATAP)
1571 		return __ipv6_isatap_ifid(eui, *(__be32 *)dev->dev_addr);
1572 	return -1;
1573 }
1574 
addrconf_ifid_gre(u8 * eui,struct net_device * dev)1575 static int addrconf_ifid_gre(u8 *eui, struct net_device *dev)
1576 {
1577 	return __ipv6_isatap_ifid(eui, *(__be32 *)dev->dev_addr);
1578 }
1579 
ipv6_generate_eui64(u8 * eui,struct net_device * dev)1580 static int ipv6_generate_eui64(u8 *eui, struct net_device *dev)
1581 {
1582 	switch (dev->type) {
1583 	case ARPHRD_ETHER:
1584 	case ARPHRD_FDDI:
1585 	case ARPHRD_IEEE802_TR:
1586 		return addrconf_ifid_eui48(eui, dev);
1587 	case ARPHRD_ARCNET:
1588 		return addrconf_ifid_arcnet(eui, dev);
1589 	case ARPHRD_INFINIBAND:
1590 		return addrconf_ifid_infiniband(eui, dev);
1591 	case ARPHRD_SIT:
1592 		return addrconf_ifid_sit(eui, dev);
1593 	case ARPHRD_IPGRE:
1594 		return addrconf_ifid_gre(eui, dev);
1595 	}
1596 	return -1;
1597 }
1598 
ipv6_inherit_eui64(u8 * eui,struct inet6_dev * idev)1599 static int ipv6_inherit_eui64(u8 *eui, struct inet6_dev *idev)
1600 {
1601 	int err = -1;
1602 	struct inet6_ifaddr *ifp;
1603 
1604 	read_lock_bh(&idev->lock);
1605 	list_for_each_entry(ifp, &idev->addr_list, if_list) {
1606 		if (ifp->scope == IFA_LINK && !(ifp->flags&IFA_F_TENTATIVE)) {
1607 			memcpy(eui, ifp->addr.s6_addr+8, 8);
1608 			err = 0;
1609 			break;
1610 		}
1611 	}
1612 	read_unlock_bh(&idev->lock);
1613 	return err;
1614 }
1615 
1616 #ifdef CONFIG_IPV6_PRIVACY
1617 /* (re)generation of randomized interface identifier (RFC 3041 3.2, 3.5) */
__ipv6_regen_rndid(struct inet6_dev * idev)1618 static int __ipv6_regen_rndid(struct inet6_dev *idev)
1619 {
1620 regen:
1621 	get_random_bytes(idev->rndid, sizeof(idev->rndid));
1622 	idev->rndid[0] &= ~0x02;
1623 
1624 	/*
1625 	 * <draft-ietf-ipngwg-temp-addresses-v2-00.txt>:
1626 	 * check if generated address is not inappropriate
1627 	 *
1628 	 *  - Reserved subnet anycast (RFC 2526)
1629 	 *	11111101 11....11 1xxxxxxx
1630 	 *  - ISATAP (RFC4214) 6.1
1631 	 *	00-00-5E-FE-xx-xx-xx-xx
1632 	 *  - value 0
1633 	 *  - XXX: already assigned to an address on the device
1634 	 */
1635 	if (idev->rndid[0] == 0xfd &&
1636 	    (idev->rndid[1]&idev->rndid[2]&idev->rndid[3]&idev->rndid[4]&idev->rndid[5]&idev->rndid[6]) == 0xff &&
1637 	    (idev->rndid[7]&0x80))
1638 		goto regen;
1639 	if ((idev->rndid[0]|idev->rndid[1]) == 0) {
1640 		if (idev->rndid[2] == 0x5e && idev->rndid[3] == 0xfe)
1641 			goto regen;
1642 		if ((idev->rndid[2]|idev->rndid[3]|idev->rndid[4]|idev->rndid[5]|idev->rndid[6]|idev->rndid[7]) == 0x00)
1643 			goto regen;
1644 	}
1645 
1646 	return 0;
1647 }
1648 
ipv6_regen_rndid(unsigned long data)1649 static void ipv6_regen_rndid(unsigned long data)
1650 {
1651 	struct inet6_dev *idev = (struct inet6_dev *) data;
1652 	unsigned long expires;
1653 
1654 	rcu_read_lock_bh();
1655 	write_lock_bh(&idev->lock);
1656 
1657 	if (idev->dead)
1658 		goto out;
1659 
1660 	if (__ipv6_regen_rndid(idev) < 0)
1661 		goto out;
1662 
1663 	expires = jiffies +
1664 		idev->cnf.temp_prefered_lft * HZ -
1665 		idev->cnf.regen_max_retry * idev->cnf.dad_transmits * idev->nd_parms->retrans_time -
1666 		idev->cnf.max_desync_factor * HZ;
1667 	if (time_before(expires, jiffies)) {
1668 		printk(KERN_WARNING
1669 			"ipv6_regen_rndid(): too short regeneration interval; timer disabled for %s.\n",
1670 			idev->dev->name);
1671 		goto out;
1672 	}
1673 
1674 	if (!mod_timer(&idev->regen_timer, expires))
1675 		in6_dev_hold(idev);
1676 
1677 out:
1678 	write_unlock_bh(&idev->lock);
1679 	rcu_read_unlock_bh();
1680 	in6_dev_put(idev);
1681 }
1682 
__ipv6_try_regen_rndid(struct inet6_dev * idev,struct in6_addr * tmpaddr)1683 static int __ipv6_try_regen_rndid(struct inet6_dev *idev, struct in6_addr *tmpaddr) {
1684 	int ret = 0;
1685 
1686 	if (tmpaddr && memcmp(idev->rndid, &tmpaddr->s6_addr[8], 8) == 0)
1687 		ret = __ipv6_regen_rndid(idev);
1688 	return ret;
1689 }
1690 #endif
1691 
1692 /*
1693  *	Add prefix route.
1694  */
1695 
1696 static void
addrconf_prefix_route(struct in6_addr * pfx,int plen,struct net_device * dev,unsigned long expires,u32 flags)1697 addrconf_prefix_route(struct in6_addr *pfx, int plen, struct net_device *dev,
1698 		      unsigned long expires, u32 flags)
1699 {
1700 	struct fib6_config cfg = {
1701 		.fc_table = RT6_TABLE_PREFIX,
1702 		.fc_metric = IP6_RT_PRIO_ADDRCONF,
1703 		.fc_ifindex = dev->ifindex,
1704 		.fc_expires = expires,
1705 		.fc_dst_len = plen,
1706 		.fc_flags = RTF_UP | flags,
1707 		.fc_nlinfo.nl_net = dev_net(dev),
1708 		.fc_protocol = RTPROT_KERNEL,
1709 	};
1710 
1711 	cfg.fc_dst = *pfx;
1712 
1713 	/* Prevent useless cloning on PtP SIT.
1714 	   This thing is done here expecting that the whole
1715 	   class of non-broadcast devices need not cloning.
1716 	 */
1717 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE)
1718 	if (dev->type == ARPHRD_SIT && (dev->flags & IFF_POINTOPOINT))
1719 		cfg.fc_flags |= RTF_NONEXTHOP;
1720 #endif
1721 
1722 	ip6_route_add(&cfg);
1723 }
1724 
1725 
addrconf_get_prefix_route(const struct in6_addr * pfx,int plen,const struct net_device * dev,u32 flags,u32 noflags)1726 static struct rt6_info *addrconf_get_prefix_route(const struct in6_addr *pfx,
1727 						  int plen,
1728 						  const struct net_device *dev,
1729 						  u32 flags, u32 noflags)
1730 {
1731 	struct fib6_node *fn;
1732 	struct rt6_info *rt = NULL;
1733 	struct fib6_table *table;
1734 
1735 	table = fib6_get_table(dev_net(dev), RT6_TABLE_PREFIX);
1736 	if (table == NULL)
1737 		return NULL;
1738 
1739 	write_lock_bh(&table->tb6_lock);
1740 	fn = fib6_locate(&table->tb6_root, pfx, plen, NULL, 0);
1741 	if (!fn)
1742 		goto out;
1743 	for (rt = fn->leaf; rt; rt = rt->dst.rt6_next) {
1744 		if (rt->dst.dev->ifindex != dev->ifindex)
1745 			continue;
1746 		if ((rt->rt6i_flags & flags) != flags)
1747 			continue;
1748 		if ((rt->rt6i_flags & noflags) != 0)
1749 			continue;
1750 		dst_hold(&rt->dst);
1751 		break;
1752 	}
1753 out:
1754 	write_unlock_bh(&table->tb6_lock);
1755 	return rt;
1756 }
1757 
1758 
1759 /* Create "default" multicast route to the interface */
1760 
addrconf_add_mroute(struct net_device * dev)1761 static void addrconf_add_mroute(struct net_device *dev)
1762 {
1763 	struct fib6_config cfg = {
1764 		.fc_table = RT6_TABLE_LOCAL,
1765 		.fc_metric = IP6_RT_PRIO_ADDRCONF,
1766 		.fc_ifindex = dev->ifindex,
1767 		.fc_dst_len = 8,
1768 		.fc_flags = RTF_UP,
1769 		.fc_nlinfo.nl_net = dev_net(dev),
1770 	};
1771 
1772 	ipv6_addr_set(&cfg.fc_dst, htonl(0xFF000000), 0, 0, 0);
1773 
1774 	ip6_route_add(&cfg);
1775 }
1776 
1777 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE)
sit_route_add(struct net_device * dev)1778 static void sit_route_add(struct net_device *dev)
1779 {
1780 	struct fib6_config cfg = {
1781 		.fc_table = RT6_TABLE_MAIN,
1782 		.fc_metric = IP6_RT_PRIO_ADDRCONF,
1783 		.fc_ifindex = dev->ifindex,
1784 		.fc_dst_len = 96,
1785 		.fc_flags = RTF_UP | RTF_NONEXTHOP,
1786 		.fc_nlinfo.nl_net = dev_net(dev),
1787 	};
1788 
1789 	/* prefix length - 96 bits "::d.d.d.d" */
1790 	ip6_route_add(&cfg);
1791 }
1792 #endif
1793 
addrconf_add_lroute(struct net_device * dev)1794 static void addrconf_add_lroute(struct net_device *dev)
1795 {
1796 	struct in6_addr addr;
1797 
1798 	ipv6_addr_set(&addr,  htonl(0xFE800000), 0, 0, 0);
1799 	addrconf_prefix_route(&addr, 64, dev, 0, 0);
1800 }
1801 
addrconf_add_dev(struct net_device * dev)1802 static struct inet6_dev *addrconf_add_dev(struct net_device *dev)
1803 {
1804 	struct inet6_dev *idev;
1805 
1806 	ASSERT_RTNL();
1807 
1808 	idev = ipv6_find_idev(dev);
1809 	if (!idev)
1810 		return ERR_PTR(-ENOBUFS);
1811 
1812 	if (idev->cnf.disable_ipv6)
1813 		return ERR_PTR(-EACCES);
1814 
1815 	/* Add default multicast route */
1816 	if (!(dev->flags & IFF_LOOPBACK))
1817 		addrconf_add_mroute(dev);
1818 
1819 	/* Add link local route */
1820 	addrconf_add_lroute(dev);
1821 	return idev;
1822 }
1823 
addrconf_prefix_rcv(struct net_device * dev,u8 * opt,int len,bool sllao)1824 void addrconf_prefix_rcv(struct net_device *dev, u8 *opt, int len, bool sllao)
1825 {
1826 	struct prefix_info *pinfo;
1827 	__u32 valid_lft;
1828 	__u32 prefered_lft;
1829 	int addr_type;
1830 	struct inet6_dev *in6_dev;
1831 	struct net *net = dev_net(dev);
1832 
1833 	pinfo = (struct prefix_info *) opt;
1834 
1835 	if (len < sizeof(struct prefix_info)) {
1836 		ADBG(("addrconf: prefix option too short\n"));
1837 		return;
1838 	}
1839 
1840 	/*
1841 	 *	Validation checks ([ADDRCONF], page 19)
1842 	 */
1843 
1844 	addr_type = ipv6_addr_type(&pinfo->prefix);
1845 
1846 	if (addr_type & (IPV6_ADDR_MULTICAST|IPV6_ADDR_LINKLOCAL))
1847 		return;
1848 
1849 	valid_lft = ntohl(pinfo->valid);
1850 	prefered_lft = ntohl(pinfo->prefered);
1851 
1852 	if (prefered_lft > valid_lft) {
1853 		if (net_ratelimit())
1854 			printk(KERN_WARNING "addrconf: prefix option has invalid lifetime\n");
1855 		return;
1856 	}
1857 
1858 	in6_dev = in6_dev_get(dev);
1859 
1860 	if (in6_dev == NULL) {
1861 		if (net_ratelimit())
1862 			printk(KERN_DEBUG "addrconf: device %s not configured\n", dev->name);
1863 		return;
1864 	}
1865 
1866 	/*
1867 	 *	Two things going on here:
1868 	 *	1) Add routes for on-link prefixes
1869 	 *	2) Configure prefixes with the auto flag set
1870 	 */
1871 
1872 	if (pinfo->onlink) {
1873 		struct rt6_info *rt;
1874 		unsigned long rt_expires;
1875 
1876 		/* Avoid arithmetic overflow. Really, we could
1877 		 * save rt_expires in seconds, likely valid_lft,
1878 		 * but it would require division in fib gc, that it
1879 		 * not good.
1880 		 */
1881 		if (HZ > USER_HZ)
1882 			rt_expires = addrconf_timeout_fixup(valid_lft, HZ);
1883 		else
1884 			rt_expires = addrconf_timeout_fixup(valid_lft, USER_HZ);
1885 
1886 		if (addrconf_finite_timeout(rt_expires))
1887 			rt_expires *= HZ;
1888 
1889 		rt = addrconf_get_prefix_route(&pinfo->prefix,
1890 					       pinfo->prefix_len,
1891 					       dev,
1892 					       RTF_ADDRCONF | RTF_PREFIX_RT,
1893 					       RTF_GATEWAY | RTF_DEFAULT);
1894 
1895 		if (rt) {
1896 			/* Autoconf prefix route */
1897 			if (valid_lft == 0) {
1898 				ip6_del_rt(rt);
1899 				rt = NULL;
1900 			} else if (addrconf_finite_timeout(rt_expires)) {
1901 				/* not infinity */
1902 				rt6_set_expires(rt, jiffies + rt_expires);
1903 			} else {
1904 				rt6_clean_expires(rt);
1905 			}
1906 		} else if (valid_lft) {
1907 			clock_t expires = 0;
1908 			int flags = RTF_ADDRCONF | RTF_PREFIX_RT;
1909 			if (addrconf_finite_timeout(rt_expires)) {
1910 				/* not infinity */
1911 				flags |= RTF_EXPIRES;
1912 				expires = jiffies_to_clock_t(rt_expires);
1913 			}
1914 			addrconf_prefix_route(&pinfo->prefix, pinfo->prefix_len,
1915 					      dev, expires, flags);
1916 		}
1917 		if (rt)
1918 			dst_release(&rt->dst);
1919 	}
1920 
1921 	/* Try to figure out our local address for this prefix */
1922 
1923 	if (pinfo->autoconf && in6_dev->cnf.autoconf) {
1924 		struct inet6_ifaddr * ifp;
1925 		struct in6_addr addr;
1926 		int create = 0, update_lft = 0;
1927 
1928 		if (pinfo->prefix_len == 64) {
1929 			memcpy(&addr, &pinfo->prefix, 8);
1930 			if (ipv6_generate_eui64(addr.s6_addr + 8, dev) &&
1931 			    ipv6_inherit_eui64(addr.s6_addr + 8, in6_dev)) {
1932 				in6_dev_put(in6_dev);
1933 				return;
1934 			}
1935 			goto ok;
1936 		}
1937 		if (net_ratelimit())
1938 			printk(KERN_DEBUG "IPv6 addrconf: prefix with wrong length %d\n",
1939 			       pinfo->prefix_len);
1940 		in6_dev_put(in6_dev);
1941 		return;
1942 
1943 ok:
1944 
1945 		ifp = ipv6_get_ifaddr(net, &addr, dev, 1);
1946 
1947 		if (ifp == NULL && valid_lft) {
1948 			int max_addresses = in6_dev->cnf.max_addresses;
1949 			u32 addr_flags = 0;
1950 
1951 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD
1952 			if (in6_dev->cnf.optimistic_dad &&
1953 			    !net->ipv6.devconf_all->forwarding && sllao)
1954 				addr_flags = IFA_F_OPTIMISTIC;
1955 #endif
1956 
1957 			/* Do not allow to create too much of autoconfigured
1958 			 * addresses; this would be too easy way to crash kernel.
1959 			 */
1960 			if (!max_addresses ||
1961 			    ipv6_count_addresses(in6_dev) < max_addresses)
1962 				ifp = ipv6_add_addr(in6_dev, &addr, pinfo->prefix_len,
1963 						    addr_type&IPV6_ADDR_SCOPE_MASK,
1964 						    addr_flags);
1965 
1966 			if (!ifp || IS_ERR(ifp)) {
1967 				in6_dev_put(in6_dev);
1968 				return;
1969 			}
1970 
1971 			update_lft = create = 1;
1972 			ifp->cstamp = jiffies;
1973 			addrconf_dad_start(ifp, RTF_ADDRCONF|RTF_PREFIX_RT);
1974 		}
1975 
1976 		if (ifp) {
1977 			int flags;
1978 			unsigned long now;
1979 #ifdef CONFIG_IPV6_PRIVACY
1980 			struct inet6_ifaddr *ift;
1981 #endif
1982 			u32 stored_lft;
1983 
1984 			/* update lifetime (RFC2462 5.5.3 e) */
1985 			spin_lock(&ifp->lock);
1986 			now = jiffies;
1987 			if (ifp->valid_lft > (now - ifp->tstamp) / HZ)
1988 				stored_lft = ifp->valid_lft - (now - ifp->tstamp) / HZ;
1989 			else
1990 				stored_lft = 0;
1991 			if (!update_lft && stored_lft) {
1992 				if (valid_lft > MIN_VALID_LIFETIME ||
1993 				    valid_lft > stored_lft)
1994 					update_lft = 1;
1995 				else if (stored_lft <= MIN_VALID_LIFETIME) {
1996 					/* valid_lft <= stored_lft is always true */
1997 					/*
1998 					 * RFC 4862 Section 5.5.3e:
1999 					 * "Note that the preferred lifetime of
2000 					 *  the corresponding address is always
2001 					 *  reset to the Preferred Lifetime in
2002 					 *  the received Prefix Information
2003 					 *  option, regardless of whether the
2004 					 *  valid lifetime is also reset or
2005 					 *  ignored."
2006 					 *
2007 					 *  So if the preferred lifetime in
2008 					 *  this advertisement is different
2009 					 *  than what we have stored, but the
2010 					 *  valid lifetime is invalid, just
2011 					 *  reset prefered_lft.
2012 					 *
2013 					 *  We must set the valid lifetime
2014 					 *  to the stored lifetime since we'll
2015 					 *  be updating the timestamp below,
2016 					 *  else we'll set it back to the
2017 					 *  minimum.
2018 					 */
2019 					if (prefered_lft != ifp->prefered_lft) {
2020 						valid_lft = stored_lft;
2021 						update_lft = 1;
2022 					}
2023 				} else {
2024 					valid_lft = MIN_VALID_LIFETIME;
2025 					if (valid_lft < prefered_lft)
2026 						prefered_lft = valid_lft;
2027 					update_lft = 1;
2028 				}
2029 			}
2030 
2031 			if (update_lft) {
2032 				ifp->valid_lft = valid_lft;
2033 				ifp->prefered_lft = prefered_lft;
2034 				ifp->tstamp = now;
2035 				flags = ifp->flags;
2036 				ifp->flags &= ~IFA_F_DEPRECATED;
2037 				spin_unlock(&ifp->lock);
2038 
2039 				if (!(flags&IFA_F_TENTATIVE))
2040 					ipv6_ifa_notify(0, ifp);
2041 			} else
2042 				spin_unlock(&ifp->lock);
2043 
2044 #ifdef CONFIG_IPV6_PRIVACY
2045 			read_lock_bh(&in6_dev->lock);
2046 			/* update all temporary addresses in the list */
2047 			list_for_each_entry(ift, &in6_dev->tempaddr_list,
2048 					    tmp_list) {
2049 				int age, max_valid, max_prefered;
2050 
2051 				if (ifp != ift->ifpub)
2052 					continue;
2053 
2054 				/*
2055 				 * RFC 4941 section 3.3:
2056 				 * If a received option will extend the lifetime
2057 				 * of a public address, the lifetimes of
2058 				 * temporary addresses should be extended,
2059 				 * subject to the overall constraint that no
2060 				 * temporary addresses should ever remain
2061 				 * "valid" or "preferred" for a time longer than
2062 				 * (TEMP_VALID_LIFETIME) or
2063 				 * (TEMP_PREFERRED_LIFETIME - DESYNC_FACTOR),
2064 				 * respectively.
2065 				 */
2066 				age = (now - ift->cstamp) / HZ;
2067 				max_valid = in6_dev->cnf.temp_valid_lft - age;
2068 				if (max_valid < 0)
2069 					max_valid = 0;
2070 
2071 				max_prefered = in6_dev->cnf.temp_prefered_lft -
2072 					       in6_dev->cnf.max_desync_factor -
2073 					       age;
2074 				if (max_prefered < 0)
2075 					max_prefered = 0;
2076 
2077 				if (valid_lft > max_valid)
2078 					valid_lft = max_valid;
2079 
2080 				if (prefered_lft > max_prefered)
2081 					prefered_lft = max_prefered;
2082 
2083 				spin_lock(&ift->lock);
2084 				flags = ift->flags;
2085 				ift->valid_lft = valid_lft;
2086 				ift->prefered_lft = prefered_lft;
2087 				ift->tstamp = now;
2088 				if (prefered_lft > 0)
2089 					ift->flags &= ~IFA_F_DEPRECATED;
2090 
2091 				spin_unlock(&ift->lock);
2092 				if (!(flags&IFA_F_TENTATIVE))
2093 					ipv6_ifa_notify(0, ift);
2094 			}
2095 
2096 			if ((create || list_empty(&in6_dev->tempaddr_list)) && in6_dev->cnf.use_tempaddr > 0) {
2097 				/*
2098 				 * When a new public address is created as
2099 				 * described in [ADDRCONF], also create a new
2100 				 * temporary address. Also create a temporary
2101 				 * address if it's enabled but no temporary
2102 				 * address currently exists.
2103 				 */
2104 				read_unlock_bh(&in6_dev->lock);
2105 				ipv6_create_tempaddr(ifp, NULL);
2106 			} else {
2107 				read_unlock_bh(&in6_dev->lock);
2108 			}
2109 #endif
2110 			in6_ifa_put(ifp);
2111 			addrconf_verify(0);
2112 		}
2113 	}
2114 	inet6_prefix_notify(RTM_NEWPREFIX, in6_dev, pinfo);
2115 	in6_dev_put(in6_dev);
2116 }
2117 
2118 /*
2119  *	Set destination address.
2120  *	Special case for SIT interfaces where we create a new "virtual"
2121  *	device.
2122  */
addrconf_set_dstaddr(struct net * net,void __user * arg)2123 int addrconf_set_dstaddr(struct net *net, void __user *arg)
2124 {
2125 	struct in6_ifreq ireq;
2126 	struct net_device *dev;
2127 	int err = -EINVAL;
2128 
2129 	rtnl_lock();
2130 
2131 	err = -EFAULT;
2132 	if (copy_from_user(&ireq, arg, sizeof(struct in6_ifreq)))
2133 		goto err_exit;
2134 
2135 	dev = __dev_get_by_index(net, ireq.ifr6_ifindex);
2136 
2137 	err = -ENODEV;
2138 	if (dev == NULL)
2139 		goto err_exit;
2140 
2141 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE)
2142 	if (dev->type == ARPHRD_SIT) {
2143 		const struct net_device_ops *ops = dev->netdev_ops;
2144 		struct ifreq ifr;
2145 		struct ip_tunnel_parm p;
2146 
2147 		err = -EADDRNOTAVAIL;
2148 		if (!(ipv6_addr_type(&ireq.ifr6_addr) & IPV6_ADDR_COMPATv4))
2149 			goto err_exit;
2150 
2151 		memset(&p, 0, sizeof(p));
2152 		p.iph.daddr = ireq.ifr6_addr.s6_addr32[3];
2153 		p.iph.saddr = 0;
2154 		p.iph.version = 4;
2155 		p.iph.ihl = 5;
2156 		p.iph.protocol = IPPROTO_IPV6;
2157 		p.iph.ttl = 64;
2158 		ifr.ifr_ifru.ifru_data = (__force void __user *)&p;
2159 
2160 		if (ops->ndo_do_ioctl) {
2161 			mm_segment_t oldfs = get_fs();
2162 
2163 			set_fs(KERNEL_DS);
2164 			err = ops->ndo_do_ioctl(dev, &ifr, SIOCADDTUNNEL);
2165 			set_fs(oldfs);
2166 		} else
2167 			err = -EOPNOTSUPP;
2168 
2169 		if (err == 0) {
2170 			err = -ENOBUFS;
2171 			dev = __dev_get_by_name(net, p.name);
2172 			if (!dev)
2173 				goto err_exit;
2174 			err = dev_open(dev);
2175 		}
2176 	}
2177 #endif
2178 
2179 err_exit:
2180 	rtnl_unlock();
2181 	return err;
2182 }
2183 
2184 /*
2185  *	Manual configuration of address on an interface
2186  */
inet6_addr_add(struct net * net,int ifindex,const struct in6_addr * pfx,unsigned int plen,__u8 ifa_flags,__u32 prefered_lft,__u32 valid_lft)2187 static int inet6_addr_add(struct net *net, int ifindex, const struct in6_addr *pfx,
2188 			  unsigned int plen, __u8 ifa_flags, __u32 prefered_lft,
2189 			  __u32 valid_lft)
2190 {
2191 	struct inet6_ifaddr *ifp;
2192 	struct inet6_dev *idev;
2193 	struct net_device *dev;
2194 	int scope;
2195 	u32 flags;
2196 	clock_t expires;
2197 	unsigned long timeout;
2198 
2199 	ASSERT_RTNL();
2200 
2201 	if (plen > 128)
2202 		return -EINVAL;
2203 
2204 	/* check the lifetime */
2205 	if (!valid_lft || prefered_lft > valid_lft)
2206 		return -EINVAL;
2207 
2208 	dev = __dev_get_by_index(net, ifindex);
2209 	if (!dev)
2210 		return -ENODEV;
2211 
2212 	idev = addrconf_add_dev(dev);
2213 	if (IS_ERR(idev))
2214 		return PTR_ERR(idev);
2215 
2216 	scope = ipv6_addr_scope(pfx);
2217 
2218 	timeout = addrconf_timeout_fixup(valid_lft, HZ);
2219 	if (addrconf_finite_timeout(timeout)) {
2220 		expires = jiffies_to_clock_t(timeout * HZ);
2221 		valid_lft = timeout;
2222 		flags = RTF_EXPIRES;
2223 	} else {
2224 		expires = 0;
2225 		flags = 0;
2226 		ifa_flags |= IFA_F_PERMANENT;
2227 	}
2228 
2229 	timeout = addrconf_timeout_fixup(prefered_lft, HZ);
2230 	if (addrconf_finite_timeout(timeout)) {
2231 		if (timeout == 0)
2232 			ifa_flags |= IFA_F_DEPRECATED;
2233 		prefered_lft = timeout;
2234 	}
2235 
2236 	ifp = ipv6_add_addr(idev, pfx, plen, scope, ifa_flags);
2237 
2238 	if (!IS_ERR(ifp)) {
2239 		spin_lock_bh(&ifp->lock);
2240 		ifp->valid_lft = valid_lft;
2241 		ifp->prefered_lft = prefered_lft;
2242 		ifp->tstamp = jiffies;
2243 		spin_unlock_bh(&ifp->lock);
2244 
2245 		addrconf_prefix_route(&ifp->addr, ifp->prefix_len, dev,
2246 				      expires, flags);
2247 		/*
2248 		 * Note that section 3.1 of RFC 4429 indicates
2249 		 * that the Optimistic flag should not be set for
2250 		 * manually configured addresses
2251 		 */
2252 		addrconf_dad_start(ifp, 0);
2253 		in6_ifa_put(ifp);
2254 		addrconf_verify(0);
2255 		return 0;
2256 	}
2257 
2258 	return PTR_ERR(ifp);
2259 }
2260 
inet6_addr_del(struct net * net,int ifindex,const struct in6_addr * pfx,unsigned int plen)2261 static int inet6_addr_del(struct net *net, int ifindex, const struct in6_addr *pfx,
2262 			  unsigned int plen)
2263 {
2264 	struct inet6_ifaddr *ifp;
2265 	struct inet6_dev *idev;
2266 	struct net_device *dev;
2267 
2268 	if (plen > 128)
2269 		return -EINVAL;
2270 
2271 	dev = __dev_get_by_index(net, ifindex);
2272 	if (!dev)
2273 		return -ENODEV;
2274 
2275 	if ((idev = __in6_dev_get(dev)) == NULL)
2276 		return -ENXIO;
2277 
2278 	read_lock_bh(&idev->lock);
2279 	list_for_each_entry(ifp, &idev->addr_list, if_list) {
2280 		if (ifp->prefix_len == plen &&
2281 		    ipv6_addr_equal(pfx, &ifp->addr)) {
2282 			in6_ifa_hold(ifp);
2283 			read_unlock_bh(&idev->lock);
2284 
2285 			ipv6_del_addr(ifp);
2286 
2287 			/* If the last address is deleted administratively,
2288 			   disable IPv6 on this interface.
2289 			 */
2290 			if (list_empty(&idev->addr_list))
2291 				addrconf_ifdown(idev->dev, 1);
2292 			return 0;
2293 		}
2294 	}
2295 	read_unlock_bh(&idev->lock);
2296 	return -EADDRNOTAVAIL;
2297 }
2298 
2299 
addrconf_add_ifaddr(struct net * net,void __user * arg)2300 int addrconf_add_ifaddr(struct net *net, void __user *arg)
2301 {
2302 	struct in6_ifreq ireq;
2303 	int err;
2304 
2305 	if (!capable(CAP_NET_ADMIN))
2306 		return -EPERM;
2307 
2308 	if (copy_from_user(&ireq, arg, sizeof(struct in6_ifreq)))
2309 		return -EFAULT;
2310 
2311 	rtnl_lock();
2312 	err = inet6_addr_add(net, ireq.ifr6_ifindex, &ireq.ifr6_addr,
2313 			     ireq.ifr6_prefixlen, IFA_F_PERMANENT,
2314 			     INFINITY_LIFE_TIME, INFINITY_LIFE_TIME);
2315 	rtnl_unlock();
2316 	return err;
2317 }
2318 
addrconf_del_ifaddr(struct net * net,void __user * arg)2319 int addrconf_del_ifaddr(struct net *net, void __user *arg)
2320 {
2321 	struct in6_ifreq ireq;
2322 	int err;
2323 
2324 	if (!capable(CAP_NET_ADMIN))
2325 		return -EPERM;
2326 
2327 	if (copy_from_user(&ireq, arg, sizeof(struct in6_ifreq)))
2328 		return -EFAULT;
2329 
2330 	rtnl_lock();
2331 	err = inet6_addr_del(net, ireq.ifr6_ifindex, &ireq.ifr6_addr,
2332 			     ireq.ifr6_prefixlen);
2333 	rtnl_unlock();
2334 	return err;
2335 }
2336 
add_addr(struct inet6_dev * idev,const struct in6_addr * addr,int plen,int scope)2337 static void add_addr(struct inet6_dev *idev, const struct in6_addr *addr,
2338 		     int plen, int scope)
2339 {
2340 	struct inet6_ifaddr *ifp;
2341 
2342 	ifp = ipv6_add_addr(idev, addr, plen, scope, IFA_F_PERMANENT);
2343 	if (!IS_ERR(ifp)) {
2344 		spin_lock_bh(&ifp->lock);
2345 		ifp->flags &= ~IFA_F_TENTATIVE;
2346 		spin_unlock_bh(&ifp->lock);
2347 		ipv6_ifa_notify(RTM_NEWADDR, ifp);
2348 		in6_ifa_put(ifp);
2349 	}
2350 }
2351 
2352 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE)
sit_add_v4_addrs(struct inet6_dev * idev)2353 static void sit_add_v4_addrs(struct inet6_dev *idev)
2354 {
2355 	struct in6_addr addr;
2356 	struct net_device *dev;
2357 	struct net *net = dev_net(idev->dev);
2358 	int scope;
2359 
2360 	ASSERT_RTNL();
2361 
2362 	memset(&addr, 0, sizeof(struct in6_addr));
2363 	memcpy(&addr.s6_addr32[3], idev->dev->dev_addr, 4);
2364 
2365 	if (idev->dev->flags&IFF_POINTOPOINT) {
2366 		addr.s6_addr32[0] = htonl(0xfe800000);
2367 		scope = IFA_LINK;
2368 	} else {
2369 		scope = IPV6_ADDR_COMPATv4;
2370 	}
2371 
2372 	if (addr.s6_addr32[3]) {
2373 		add_addr(idev, &addr, 128, scope);
2374 		return;
2375 	}
2376 
2377 	for_each_netdev(net, dev) {
2378 		struct in_device * in_dev = __in_dev_get_rtnl(dev);
2379 		if (in_dev && (dev->flags & IFF_UP)) {
2380 			struct in_ifaddr * ifa;
2381 
2382 			int flag = scope;
2383 
2384 			for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
2385 				int plen;
2386 
2387 				addr.s6_addr32[3] = ifa->ifa_local;
2388 
2389 				if (ifa->ifa_scope == RT_SCOPE_LINK)
2390 					continue;
2391 				if (ifa->ifa_scope >= RT_SCOPE_HOST) {
2392 					if (idev->dev->flags&IFF_POINTOPOINT)
2393 						continue;
2394 					flag |= IFA_HOST;
2395 				}
2396 				if (idev->dev->flags&IFF_POINTOPOINT)
2397 					plen = 64;
2398 				else
2399 					plen = 96;
2400 
2401 				add_addr(idev, &addr, plen, flag);
2402 			}
2403 		}
2404 	}
2405 }
2406 #endif
2407 
init_loopback(struct net_device * dev)2408 static void init_loopback(struct net_device *dev)
2409 {
2410 	struct inet6_dev  *idev;
2411 	struct net_device *sp_dev;
2412 	struct inet6_ifaddr *sp_ifa;
2413 	struct rt6_info *sp_rt;
2414 
2415 	/* ::1 */
2416 
2417 	ASSERT_RTNL();
2418 
2419 	if ((idev = ipv6_find_idev(dev)) == NULL) {
2420 		printk(KERN_DEBUG "init loopback: add_dev failed\n");
2421 		return;
2422 	}
2423 
2424 	add_addr(idev, &in6addr_loopback, 128, IFA_HOST);
2425 
2426 	/* Add routes to other interface's IPv6 addresses */
2427 	for_each_netdev(dev_net(dev), sp_dev) {
2428 		if (!strcmp(sp_dev->name, dev->name))
2429 			continue;
2430 
2431 		idev = __in6_dev_get(sp_dev);
2432 		if (!idev)
2433 			continue;
2434 
2435 		read_lock_bh(&idev->lock);
2436 		list_for_each_entry(sp_ifa, &idev->addr_list, if_list) {
2437 
2438 			if (sp_ifa->flags & (IFA_F_DADFAILED | IFA_F_TENTATIVE))
2439 				continue;
2440 
2441 			if (sp_ifa->rt)
2442 				continue;
2443 
2444 			sp_rt = addrconf_dst_alloc(idev, &sp_ifa->addr, 0);
2445 
2446 			/* Failure cases are ignored */
2447 			if (!IS_ERR(sp_rt)) {
2448 				sp_ifa->rt = sp_rt;
2449 				ip6_ins_rt(sp_rt);
2450 			}
2451 		}
2452 		read_unlock_bh(&idev->lock);
2453 	}
2454 }
2455 
addrconf_add_linklocal(struct inet6_dev * idev,const struct in6_addr * addr)2456 static void addrconf_add_linklocal(struct inet6_dev *idev, const struct in6_addr *addr)
2457 {
2458 	struct inet6_ifaddr * ifp;
2459 	u32 addr_flags = IFA_F_PERMANENT;
2460 
2461 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD
2462 	if (idev->cnf.optimistic_dad &&
2463 	    !dev_net(idev->dev)->ipv6.devconf_all->forwarding)
2464 		addr_flags |= IFA_F_OPTIMISTIC;
2465 #endif
2466 
2467 
2468 	ifp = ipv6_add_addr(idev, addr, 64, IFA_LINK, addr_flags);
2469 	if (!IS_ERR(ifp)) {
2470 		addrconf_prefix_route(&ifp->addr, ifp->prefix_len, idev->dev, 0, 0);
2471 		addrconf_dad_start(ifp, 0);
2472 		in6_ifa_put(ifp);
2473 	}
2474 }
2475 
addrconf_dev_config(struct net_device * dev)2476 static void addrconf_dev_config(struct net_device *dev)
2477 {
2478 	struct in6_addr addr;
2479 	struct inet6_dev    * idev;
2480 
2481 	ASSERT_RTNL();
2482 
2483 	if ((dev->type != ARPHRD_ETHER) &&
2484 	    (dev->type != ARPHRD_FDDI) &&
2485 	    (dev->type != ARPHRD_IEEE802_TR) &&
2486 	    (dev->type != ARPHRD_ARCNET) &&
2487 	    (dev->type != ARPHRD_INFINIBAND)) {
2488 		/* Alas, we support only Ethernet autoconfiguration. */
2489 		return;
2490 	}
2491 
2492 	idev = addrconf_add_dev(dev);
2493 	if (IS_ERR(idev))
2494 		return;
2495 
2496 	memset(&addr, 0, sizeof(struct in6_addr));
2497 	addr.s6_addr32[0] = htonl(0xFE800000);
2498 
2499 	if (ipv6_generate_eui64(addr.s6_addr + 8, dev) == 0)
2500 		addrconf_add_linklocal(idev, &addr);
2501 }
2502 
2503 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE)
addrconf_sit_config(struct net_device * dev)2504 static void addrconf_sit_config(struct net_device *dev)
2505 {
2506 	struct inet6_dev *idev;
2507 
2508 	ASSERT_RTNL();
2509 
2510 	/*
2511 	 * Configure the tunnel with one of our IPv4
2512 	 * addresses... we should configure all of
2513 	 * our v4 addrs in the tunnel
2514 	 */
2515 
2516 	if ((idev = ipv6_find_idev(dev)) == NULL) {
2517 		printk(KERN_DEBUG "init sit: add_dev failed\n");
2518 		return;
2519 	}
2520 
2521 	if (dev->priv_flags & IFF_ISATAP) {
2522 		struct in6_addr addr;
2523 
2524 		ipv6_addr_set(&addr,  htonl(0xFE800000), 0, 0, 0);
2525 		addrconf_prefix_route(&addr, 64, dev, 0, 0);
2526 		if (!ipv6_generate_eui64(addr.s6_addr + 8, dev))
2527 			addrconf_add_linklocal(idev, &addr);
2528 		return;
2529 	}
2530 
2531 	sit_add_v4_addrs(idev);
2532 
2533 	if (dev->flags&IFF_POINTOPOINT) {
2534 		addrconf_add_mroute(dev);
2535 		addrconf_add_lroute(dev);
2536 	} else
2537 		sit_route_add(dev);
2538 }
2539 #endif
2540 
2541 #if defined(CONFIG_NET_IPGRE) || defined(CONFIG_NET_IPGRE_MODULE)
addrconf_gre_config(struct net_device * dev)2542 static void addrconf_gre_config(struct net_device *dev)
2543 {
2544 	struct inet6_dev *idev;
2545 	struct in6_addr addr;
2546 
2547 	pr_info("ipv6: addrconf_gre_config(%s)\n", dev->name);
2548 
2549 	ASSERT_RTNL();
2550 
2551 	if ((idev = ipv6_find_idev(dev)) == NULL) {
2552 		printk(KERN_DEBUG "init gre: add_dev failed\n");
2553 		return;
2554 	}
2555 
2556 	ipv6_addr_set(&addr,  htonl(0xFE800000), 0, 0, 0);
2557 	addrconf_prefix_route(&addr, 64, dev, 0, 0);
2558 
2559 	if (!ipv6_generate_eui64(addr.s6_addr + 8, dev))
2560 		addrconf_add_linklocal(idev, &addr);
2561 }
2562 #endif
2563 
2564 static inline int
ipv6_inherit_linklocal(struct inet6_dev * idev,struct net_device * link_dev)2565 ipv6_inherit_linklocal(struct inet6_dev *idev, struct net_device *link_dev)
2566 {
2567 	struct in6_addr lladdr;
2568 
2569 	if (!ipv6_get_lladdr(link_dev, &lladdr, IFA_F_TENTATIVE)) {
2570 		addrconf_add_linklocal(idev, &lladdr);
2571 		return 0;
2572 	}
2573 	return -1;
2574 }
2575 
ip6_tnl_add_linklocal(struct inet6_dev * idev)2576 static void ip6_tnl_add_linklocal(struct inet6_dev *idev)
2577 {
2578 	struct net_device *link_dev;
2579 	struct net *net = dev_net(idev->dev);
2580 
2581 	/* first try to inherit the link-local address from the link device */
2582 	if (idev->dev->iflink &&
2583 	    (link_dev = __dev_get_by_index(net, idev->dev->iflink))) {
2584 		if (!ipv6_inherit_linklocal(idev, link_dev))
2585 			return;
2586 	}
2587 	/* then try to inherit it from any device */
2588 	for_each_netdev(net, link_dev) {
2589 		if (!ipv6_inherit_linklocal(idev, link_dev))
2590 			return;
2591 	}
2592 	printk(KERN_DEBUG "init ip6-ip6: add_linklocal failed\n");
2593 }
2594 
2595 /*
2596  * Autoconfigure tunnel with a link-local address so routing protocols,
2597  * DHCPv6, MLD etc. can be run over the virtual link
2598  */
2599 
addrconf_ip6_tnl_config(struct net_device * dev)2600 static void addrconf_ip6_tnl_config(struct net_device *dev)
2601 {
2602 	struct inet6_dev *idev;
2603 
2604 	ASSERT_RTNL();
2605 
2606 	idev = addrconf_add_dev(dev);
2607 	if (IS_ERR(idev)) {
2608 		printk(KERN_DEBUG "init ip6-ip6: add_dev failed\n");
2609 		return;
2610 	}
2611 	ip6_tnl_add_linklocal(idev);
2612 }
2613 
addrconf_notify(struct notifier_block * this,unsigned long event,void * data)2614 static int addrconf_notify(struct notifier_block *this, unsigned long event,
2615 			   void * data)
2616 {
2617 	struct net_device *dev = (struct net_device *) data;
2618 	struct inet6_dev *idev = __in6_dev_get(dev);
2619 	int run_pending = 0;
2620 	int err;
2621 
2622 	switch (event) {
2623 	case NETDEV_REGISTER:
2624 		if (!idev && dev->mtu >= IPV6_MIN_MTU) {
2625 			idev = ipv6_add_dev(dev);
2626 			if (!idev)
2627 				return notifier_from_errno(-ENOMEM);
2628 		}
2629 		break;
2630 
2631 	case NETDEV_UP:
2632 	case NETDEV_CHANGE:
2633 		if (dev->flags & IFF_SLAVE)
2634 			break;
2635 
2636 		if (event == NETDEV_UP) {
2637 			if (!addrconf_qdisc_ok(dev)) {
2638 				/* device is not ready yet. */
2639 				printk(KERN_INFO
2640 					"ADDRCONF(NETDEV_UP): %s: "
2641 					"link is not ready\n",
2642 					dev->name);
2643 				break;
2644 			}
2645 
2646 			if (!idev && dev->mtu >= IPV6_MIN_MTU)
2647 				idev = ipv6_add_dev(dev);
2648 
2649 			if (idev) {
2650 				idev->if_flags |= IF_READY;
2651 				run_pending = 1;
2652 			}
2653 		} else {
2654 			if (!addrconf_qdisc_ok(dev)) {
2655 				/* device is still not ready. */
2656 				break;
2657 			}
2658 
2659 			if (idev) {
2660 				if (idev->if_flags & IF_READY)
2661 					/* device is already configured. */
2662 					break;
2663 				idev->if_flags |= IF_READY;
2664 			}
2665 
2666 			printk(KERN_INFO
2667 					"ADDRCONF(NETDEV_CHANGE): %s: "
2668 					"link becomes ready\n",
2669 					dev->name);
2670 
2671 			run_pending = 1;
2672 		}
2673 
2674 		switch (dev->type) {
2675 #if defined(CONFIG_IPV6_SIT) || defined(CONFIG_IPV6_SIT_MODULE)
2676 		case ARPHRD_SIT:
2677 			addrconf_sit_config(dev);
2678 			break;
2679 #endif
2680 #if defined(CONFIG_NET_IPGRE) || defined(CONFIG_NET_IPGRE_MODULE)
2681 		case ARPHRD_IPGRE:
2682 			addrconf_gre_config(dev);
2683 			break;
2684 #endif
2685 		case ARPHRD_TUNNEL6:
2686 			addrconf_ip6_tnl_config(dev);
2687 			break;
2688 		case ARPHRD_LOOPBACK:
2689 			init_loopback(dev);
2690 			break;
2691 
2692 		default:
2693 			addrconf_dev_config(dev);
2694 			break;
2695 		}
2696 
2697 		if (idev) {
2698 			if (run_pending)
2699 				addrconf_dad_run(idev);
2700 
2701 			/*
2702 			 * If the MTU changed during the interface down,
2703 			 * when the interface up, the changed MTU must be
2704 			 * reflected in the idev as well as routers.
2705 			 */
2706 			if (idev->cnf.mtu6 != dev->mtu &&
2707 			    dev->mtu >= IPV6_MIN_MTU) {
2708 				rt6_mtu_change(dev, dev->mtu);
2709 				idev->cnf.mtu6 = dev->mtu;
2710 			}
2711 			idev->tstamp = jiffies;
2712 			inet6_ifinfo_notify(RTM_NEWLINK, idev);
2713 
2714 			/*
2715 			 * If the changed mtu during down is lower than
2716 			 * IPV6_MIN_MTU stop IPv6 on this interface.
2717 			 */
2718 			if (dev->mtu < IPV6_MIN_MTU)
2719 				addrconf_ifdown(dev, 1);
2720 		}
2721 		break;
2722 
2723 	case NETDEV_CHANGEMTU:
2724 		if (idev && dev->mtu >= IPV6_MIN_MTU) {
2725 			rt6_mtu_change(dev, dev->mtu);
2726 			idev->cnf.mtu6 = dev->mtu;
2727 			break;
2728 		}
2729 
2730 		if (!idev && dev->mtu >= IPV6_MIN_MTU) {
2731 			idev = ipv6_add_dev(dev);
2732 			if (idev)
2733 				break;
2734 		}
2735 
2736 		/*
2737 		 * MTU falled under IPV6_MIN_MTU.
2738 		 * Stop IPv6 on this interface.
2739 		 */
2740 
2741 	case NETDEV_DOWN:
2742 	case NETDEV_UNREGISTER:
2743 		/*
2744 		 *	Remove all addresses from this interface.
2745 		 */
2746 		addrconf_ifdown(dev, event != NETDEV_DOWN);
2747 		break;
2748 
2749 	case NETDEV_CHANGENAME:
2750 		if (idev) {
2751 			snmp6_unregister_dev(idev);
2752 			addrconf_sysctl_unregister(idev);
2753 			addrconf_sysctl_register(idev);
2754 			err = snmp6_register_dev(idev);
2755 			if (err)
2756 				return notifier_from_errno(err);
2757 		}
2758 		break;
2759 
2760 	case NETDEV_PRE_TYPE_CHANGE:
2761 	case NETDEV_POST_TYPE_CHANGE:
2762 		addrconf_type_change(dev, event);
2763 		break;
2764 	}
2765 
2766 	return NOTIFY_OK;
2767 }
2768 
2769 /*
2770  *	addrconf module should be notified of a device going up
2771  */
2772 static struct notifier_block ipv6_dev_notf = {
2773 	.notifier_call = addrconf_notify,
2774 };
2775 
addrconf_type_change(struct net_device * dev,unsigned long event)2776 static void addrconf_type_change(struct net_device *dev, unsigned long event)
2777 {
2778 	struct inet6_dev *idev;
2779 	ASSERT_RTNL();
2780 
2781 	idev = __in6_dev_get(dev);
2782 
2783 	if (event == NETDEV_POST_TYPE_CHANGE)
2784 		ipv6_mc_remap(idev);
2785 	else if (event == NETDEV_PRE_TYPE_CHANGE)
2786 		ipv6_mc_unmap(idev);
2787 }
2788 
addrconf_ifdown(struct net_device * dev,int how)2789 static int addrconf_ifdown(struct net_device *dev, int how)
2790 {
2791 	struct net *net = dev_net(dev);
2792 	struct inet6_dev *idev;
2793 	struct inet6_ifaddr *ifa;
2794 	int state, i;
2795 
2796 	ASSERT_RTNL();
2797 
2798 	rt6_ifdown(net, dev);
2799 	neigh_ifdown(&nd_tbl, dev);
2800 
2801 	idev = __in6_dev_get(dev);
2802 	if (idev == NULL)
2803 		return -ENODEV;
2804 
2805 	/*
2806 	 * Step 1: remove reference to ipv6 device from parent device.
2807 	 *	   Do not dev_put!
2808 	 */
2809 	if (how) {
2810 		idev->dead = 1;
2811 
2812 		/* protected by rtnl_lock */
2813 		RCU_INIT_POINTER(dev->ip6_ptr, NULL);
2814 
2815 		/* Step 1.5: remove snmp6 entry */
2816 		snmp6_unregister_dev(idev);
2817 
2818 	}
2819 
2820 	/* Step 2: clear hash table */
2821 	for (i = 0; i < IN6_ADDR_HSIZE; i++) {
2822 		struct hlist_head *h = &inet6_addr_lst[i];
2823 		struct hlist_node *n;
2824 
2825 		spin_lock_bh(&addrconf_hash_lock);
2826 	restart:
2827 		hlist_for_each_entry_rcu(ifa, n, h, addr_lst) {
2828 			if (ifa->idev == idev) {
2829 				hlist_del_init_rcu(&ifa->addr_lst);
2830 				addrconf_del_timer(ifa);
2831 				goto restart;
2832 			}
2833 		}
2834 		spin_unlock_bh(&addrconf_hash_lock);
2835 	}
2836 
2837 	write_lock_bh(&idev->lock);
2838 
2839 	/* Step 2: clear flags for stateless addrconf */
2840 	if (!how)
2841 		idev->if_flags &= ~(IF_RS_SENT|IF_RA_RCVD|IF_READY);
2842 
2843 #ifdef CONFIG_IPV6_PRIVACY
2844 	if (how && del_timer(&idev->regen_timer))
2845 		in6_dev_put(idev);
2846 
2847 	/* Step 3: clear tempaddr list */
2848 	while (!list_empty(&idev->tempaddr_list)) {
2849 		ifa = list_first_entry(&idev->tempaddr_list,
2850 				       struct inet6_ifaddr, tmp_list);
2851 		list_del(&ifa->tmp_list);
2852 		write_unlock_bh(&idev->lock);
2853 		spin_lock_bh(&ifa->lock);
2854 
2855 		if (ifa->ifpub) {
2856 			in6_ifa_put(ifa->ifpub);
2857 			ifa->ifpub = NULL;
2858 		}
2859 		spin_unlock_bh(&ifa->lock);
2860 		in6_ifa_put(ifa);
2861 		write_lock_bh(&idev->lock);
2862 	}
2863 #endif
2864 
2865 	while (!list_empty(&idev->addr_list)) {
2866 		ifa = list_first_entry(&idev->addr_list,
2867 				       struct inet6_ifaddr, if_list);
2868 		addrconf_del_timer(ifa);
2869 
2870 		list_del(&ifa->if_list);
2871 
2872 		write_unlock_bh(&idev->lock);
2873 
2874 		spin_lock_bh(&ifa->state_lock);
2875 		state = ifa->state;
2876 		ifa->state = INET6_IFADDR_STATE_DEAD;
2877 		spin_unlock_bh(&ifa->state_lock);
2878 
2879 		if (state != INET6_IFADDR_STATE_DEAD) {
2880 			__ipv6_ifa_notify(RTM_DELADDR, ifa);
2881 			atomic_notifier_call_chain(&inet6addr_chain, NETDEV_DOWN, ifa);
2882 		}
2883 		in6_ifa_put(ifa);
2884 
2885 		write_lock_bh(&idev->lock);
2886 	}
2887 
2888 	write_unlock_bh(&idev->lock);
2889 
2890 	/* Step 5: Discard multicast list */
2891 	if (how)
2892 		ipv6_mc_destroy_dev(idev);
2893 	else
2894 		ipv6_mc_down(idev);
2895 
2896 	idev->tstamp = jiffies;
2897 
2898 	/* Last: Shot the device (if unregistered) */
2899 	if (how) {
2900 		addrconf_sysctl_unregister(idev);
2901 		neigh_parms_release(&nd_tbl, idev->nd_parms);
2902 		neigh_ifdown(&nd_tbl, dev);
2903 		in6_dev_put(idev);
2904 	}
2905 	return 0;
2906 }
2907 
addrconf_rs_timer(unsigned long data)2908 static void addrconf_rs_timer(unsigned long data)
2909 {
2910 	struct inet6_ifaddr *ifp = (struct inet6_ifaddr *) data;
2911 	struct inet6_dev *idev = ifp->idev;
2912 
2913 	read_lock(&idev->lock);
2914 	if (idev->dead || !(idev->if_flags & IF_READY))
2915 		goto out;
2916 
2917 	if (idev->cnf.forwarding)
2918 		goto out;
2919 
2920 	/* Announcement received after solicitation was sent */
2921 	if (idev->if_flags & IF_RA_RCVD)
2922 		goto out;
2923 
2924 	spin_lock(&ifp->lock);
2925 	if (ifp->probes++ < idev->cnf.rtr_solicits) {
2926 		/* The wait after the last probe can be shorter */
2927 		addrconf_mod_timer(ifp, AC_RS,
2928 				   (ifp->probes == idev->cnf.rtr_solicits) ?
2929 				   idev->cnf.rtr_solicit_delay :
2930 				   idev->cnf.rtr_solicit_interval);
2931 		spin_unlock(&ifp->lock);
2932 
2933 		ndisc_send_rs(idev->dev, &ifp->addr, &in6addr_linklocal_allrouters);
2934 	} else {
2935 		spin_unlock(&ifp->lock);
2936 		/*
2937 		 * Note: we do not support deprecated "all on-link"
2938 		 * assumption any longer.
2939 		 */
2940 		printk(KERN_DEBUG "%s: no IPv6 routers present\n",
2941 		       idev->dev->name);
2942 	}
2943 
2944 out:
2945 	read_unlock(&idev->lock);
2946 	in6_ifa_put(ifp);
2947 }
2948 
2949 /*
2950  *	Duplicate Address Detection
2951  */
addrconf_dad_kick(struct inet6_ifaddr * ifp)2952 static void addrconf_dad_kick(struct inet6_ifaddr *ifp)
2953 {
2954 	unsigned long rand_num;
2955 	struct inet6_dev *idev = ifp->idev;
2956 
2957 	if (ifp->flags & IFA_F_OPTIMISTIC)
2958 		rand_num = 0;
2959 	else
2960 		rand_num = net_random() % (idev->cnf.rtr_solicit_delay ? : 1);
2961 
2962 	ifp->probes = idev->cnf.dad_transmits;
2963 	addrconf_mod_timer(ifp, AC_DAD, rand_num);
2964 }
2965 
addrconf_dad_start(struct inet6_ifaddr * ifp,u32 flags)2966 static void addrconf_dad_start(struct inet6_ifaddr *ifp, u32 flags)
2967 {
2968 	struct inet6_dev *idev = ifp->idev;
2969 	struct net_device *dev = idev->dev;
2970 
2971 	addrconf_join_solict(dev, &ifp->addr);
2972 
2973 	net_srandom(ifp->addr.s6_addr32[3]);
2974 
2975 	read_lock_bh(&idev->lock);
2976 	spin_lock(&ifp->lock);
2977 	if (ifp->state == INET6_IFADDR_STATE_DEAD)
2978 		goto out;
2979 
2980 	if (dev->flags&(IFF_NOARP|IFF_LOOPBACK) ||
2981 	    idev->cnf.accept_dad < 1 ||
2982 	    !(ifp->flags&IFA_F_TENTATIVE) ||
2983 	    ifp->flags & IFA_F_NODAD) {
2984 		ifp->flags &= ~(IFA_F_TENTATIVE|IFA_F_OPTIMISTIC|IFA_F_DADFAILED);
2985 		spin_unlock(&ifp->lock);
2986 		read_unlock_bh(&idev->lock);
2987 
2988 		addrconf_dad_completed(ifp);
2989 		return;
2990 	}
2991 
2992 	if (!(idev->if_flags & IF_READY)) {
2993 		spin_unlock(&ifp->lock);
2994 		read_unlock_bh(&idev->lock);
2995 		/*
2996 		 * If the device is not ready:
2997 		 * - keep it tentative if it is a permanent address.
2998 		 * - otherwise, kill it.
2999 		 */
3000 		in6_ifa_hold(ifp);
3001 		addrconf_dad_stop(ifp, 0);
3002 		return;
3003 	}
3004 
3005 	/*
3006 	 * Optimistic nodes can start receiving
3007 	 * Frames right away
3008 	 */
3009 	if (ifp->flags & IFA_F_OPTIMISTIC)
3010 		ip6_ins_rt(ifp->rt);
3011 
3012 	addrconf_dad_kick(ifp);
3013 out:
3014 	spin_unlock(&ifp->lock);
3015 	read_unlock_bh(&idev->lock);
3016 }
3017 
addrconf_dad_timer(unsigned long data)3018 static void addrconf_dad_timer(unsigned long data)
3019 {
3020 	struct inet6_ifaddr *ifp = (struct inet6_ifaddr *) data;
3021 	struct inet6_dev *idev = ifp->idev;
3022 	struct in6_addr mcaddr;
3023 
3024 	if (!ifp->probes && addrconf_dad_end(ifp))
3025 		goto out;
3026 
3027 	read_lock(&idev->lock);
3028 	if (idev->dead || !(idev->if_flags & IF_READY)) {
3029 		read_unlock(&idev->lock);
3030 		goto out;
3031 	}
3032 
3033 	spin_lock(&ifp->lock);
3034 	if (ifp->state == INET6_IFADDR_STATE_DEAD) {
3035 		spin_unlock(&ifp->lock);
3036 		read_unlock(&idev->lock);
3037 		goto out;
3038 	}
3039 
3040 	if (ifp->probes == 0) {
3041 		/*
3042 		 * DAD was successful
3043 		 */
3044 
3045 		ifp->flags &= ~(IFA_F_TENTATIVE|IFA_F_OPTIMISTIC|IFA_F_DADFAILED);
3046 		spin_unlock(&ifp->lock);
3047 		read_unlock(&idev->lock);
3048 
3049 		addrconf_dad_completed(ifp);
3050 
3051 		goto out;
3052 	}
3053 
3054 	ifp->probes--;
3055 	addrconf_mod_timer(ifp, AC_DAD, ifp->idev->nd_parms->retrans_time);
3056 	spin_unlock(&ifp->lock);
3057 	read_unlock(&idev->lock);
3058 
3059 	/* send a neighbour solicitation for our addr */
3060 	addrconf_addr_solict_mult(&ifp->addr, &mcaddr);
3061 	ndisc_send_ns(ifp->idev->dev, NULL, &ifp->addr, &mcaddr, &in6addr_any);
3062 out:
3063 	in6_ifa_put(ifp);
3064 }
3065 
addrconf_dad_completed(struct inet6_ifaddr * ifp)3066 static void addrconf_dad_completed(struct inet6_ifaddr *ifp)
3067 {
3068 	struct net_device *dev = ifp->idev->dev;
3069 
3070 	/*
3071 	 *	Configure the address for reception. Now it is valid.
3072 	 */
3073 
3074 	ipv6_ifa_notify(RTM_NEWADDR, ifp);
3075 
3076 	/* If added prefix is link local and we are prepared to process
3077 	   router advertisements, start sending router solicitations.
3078 	 */
3079 
3080 	if (((ifp->idev->cnf.accept_ra == 1 && !ifp->idev->cnf.forwarding) ||
3081 	     ifp->idev->cnf.accept_ra == 2) &&
3082 	    ifp->idev->cnf.rtr_solicits > 0 &&
3083 	    (dev->flags&IFF_LOOPBACK) == 0 &&
3084 	    (ipv6_addr_type(&ifp->addr) & IPV6_ADDR_LINKLOCAL)) {
3085 		/*
3086 		 *	If a host as already performed a random delay
3087 		 *	[...] as part of DAD [...] there is no need
3088 		 *	to delay again before sending the first RS
3089 		 */
3090 		ndisc_send_rs(ifp->idev->dev, &ifp->addr, &in6addr_linklocal_allrouters);
3091 
3092 		spin_lock_bh(&ifp->lock);
3093 		ifp->probes = 1;
3094 		ifp->idev->if_flags |= IF_RS_SENT;
3095 		addrconf_mod_timer(ifp, AC_RS, ifp->idev->cnf.rtr_solicit_interval);
3096 		spin_unlock_bh(&ifp->lock);
3097 	}
3098 }
3099 
addrconf_dad_run(struct inet6_dev * idev)3100 static void addrconf_dad_run(struct inet6_dev *idev)
3101 {
3102 	struct inet6_ifaddr *ifp;
3103 
3104 	read_lock_bh(&idev->lock);
3105 	list_for_each_entry(ifp, &idev->addr_list, if_list) {
3106 		spin_lock(&ifp->lock);
3107 		if (ifp->flags & IFA_F_TENTATIVE &&
3108 		    ifp->state == INET6_IFADDR_STATE_DAD)
3109 			addrconf_dad_kick(ifp);
3110 		spin_unlock(&ifp->lock);
3111 	}
3112 	read_unlock_bh(&idev->lock);
3113 }
3114 
3115 #ifdef CONFIG_PROC_FS
3116 struct if6_iter_state {
3117 	struct seq_net_private p;
3118 	int bucket;
3119 	int offset;
3120 };
3121 
if6_get_first(struct seq_file * seq,loff_t pos)3122 static struct inet6_ifaddr *if6_get_first(struct seq_file *seq, loff_t pos)
3123 {
3124 	struct inet6_ifaddr *ifa = NULL;
3125 	struct if6_iter_state *state = seq->private;
3126 	struct net *net = seq_file_net(seq);
3127 	int p = 0;
3128 
3129 	/* initial bucket if pos is 0 */
3130 	if (pos == 0) {
3131 		state->bucket = 0;
3132 		state->offset = 0;
3133 	}
3134 
3135 	for (; state->bucket < IN6_ADDR_HSIZE; ++state->bucket) {
3136 		struct hlist_node *n;
3137 		hlist_for_each_entry_rcu_bh(ifa, n, &inet6_addr_lst[state->bucket],
3138 					 addr_lst) {
3139 			if (!net_eq(dev_net(ifa->idev->dev), net))
3140 				continue;
3141 			/* sync with offset */
3142 			if (p < state->offset) {
3143 				p++;
3144 				continue;
3145 			}
3146 			state->offset++;
3147 			return ifa;
3148 		}
3149 
3150 		/* prepare for next bucket */
3151 		state->offset = 0;
3152 		p = 0;
3153 	}
3154 	return NULL;
3155 }
3156 
if6_get_next(struct seq_file * seq,struct inet6_ifaddr * ifa)3157 static struct inet6_ifaddr *if6_get_next(struct seq_file *seq,
3158 					 struct inet6_ifaddr *ifa)
3159 {
3160 	struct if6_iter_state *state = seq->private;
3161 	struct net *net = seq_file_net(seq);
3162 	struct hlist_node *n = &ifa->addr_lst;
3163 
3164 	hlist_for_each_entry_continue_rcu_bh(ifa, n, addr_lst) {
3165 		if (!net_eq(dev_net(ifa->idev->dev), net))
3166 			continue;
3167 		state->offset++;
3168 		return ifa;
3169 	}
3170 
3171 	while (++state->bucket < IN6_ADDR_HSIZE) {
3172 		state->offset = 0;
3173 		hlist_for_each_entry_rcu_bh(ifa, n,
3174 				     &inet6_addr_lst[state->bucket], addr_lst) {
3175 			if (!net_eq(dev_net(ifa->idev->dev), net))
3176 				continue;
3177 			state->offset++;
3178 			return ifa;
3179 		}
3180 	}
3181 
3182 	return NULL;
3183 }
3184 
if6_seq_start(struct seq_file * seq,loff_t * pos)3185 static void *if6_seq_start(struct seq_file *seq, loff_t *pos)
3186 	__acquires(rcu_bh)
3187 {
3188 	rcu_read_lock_bh();
3189 	return if6_get_first(seq, *pos);
3190 }
3191 
if6_seq_next(struct seq_file * seq,void * v,loff_t * pos)3192 static void *if6_seq_next(struct seq_file *seq, void *v, loff_t *pos)
3193 {
3194 	struct inet6_ifaddr *ifa;
3195 
3196 	ifa = if6_get_next(seq, v);
3197 	++*pos;
3198 	return ifa;
3199 }
3200 
if6_seq_stop(struct seq_file * seq,void * v)3201 static void if6_seq_stop(struct seq_file *seq, void *v)
3202 	__releases(rcu_bh)
3203 {
3204 	rcu_read_unlock_bh();
3205 }
3206 
if6_seq_show(struct seq_file * seq,void * v)3207 static int if6_seq_show(struct seq_file *seq, void *v)
3208 {
3209 	struct inet6_ifaddr *ifp = (struct inet6_ifaddr *)v;
3210 	seq_printf(seq, "%pi6 %02x %02x %02x %02x %8s\n",
3211 		   &ifp->addr,
3212 		   ifp->idev->dev->ifindex,
3213 		   ifp->prefix_len,
3214 		   ifp->scope,
3215 		   ifp->flags,
3216 		   ifp->idev->dev->name);
3217 	return 0;
3218 }
3219 
3220 static const struct seq_operations if6_seq_ops = {
3221 	.start	= if6_seq_start,
3222 	.next	= if6_seq_next,
3223 	.show	= if6_seq_show,
3224 	.stop	= if6_seq_stop,
3225 };
3226 
if6_seq_open(struct inode * inode,struct file * file)3227 static int if6_seq_open(struct inode *inode, struct file *file)
3228 {
3229 	return seq_open_net(inode, file, &if6_seq_ops,
3230 			    sizeof(struct if6_iter_state));
3231 }
3232 
3233 static const struct file_operations if6_fops = {
3234 	.owner		= THIS_MODULE,
3235 	.open		= if6_seq_open,
3236 	.read		= seq_read,
3237 	.llseek		= seq_lseek,
3238 	.release	= seq_release_net,
3239 };
3240 
if6_proc_net_init(struct net * net)3241 static int __net_init if6_proc_net_init(struct net *net)
3242 {
3243 	if (!proc_net_fops_create(net, "if_inet6", S_IRUGO, &if6_fops))
3244 		return -ENOMEM;
3245 	return 0;
3246 }
3247 
if6_proc_net_exit(struct net * net)3248 static void __net_exit if6_proc_net_exit(struct net *net)
3249 {
3250        proc_net_remove(net, "if_inet6");
3251 }
3252 
3253 static struct pernet_operations if6_proc_net_ops = {
3254        .init = if6_proc_net_init,
3255        .exit = if6_proc_net_exit,
3256 };
3257 
if6_proc_init(void)3258 int __init if6_proc_init(void)
3259 {
3260 	return register_pernet_subsys(&if6_proc_net_ops);
3261 }
3262 
if6_proc_exit(void)3263 void if6_proc_exit(void)
3264 {
3265 	unregister_pernet_subsys(&if6_proc_net_ops);
3266 }
3267 #endif	/* CONFIG_PROC_FS */
3268 
3269 #if defined(CONFIG_IPV6_MIP6) || defined(CONFIG_IPV6_MIP6_MODULE)
3270 /* Check if address is a home address configured on any interface. */
ipv6_chk_home_addr(struct net * net,const struct in6_addr * addr)3271 int ipv6_chk_home_addr(struct net *net, const struct in6_addr *addr)
3272 {
3273 	int ret = 0;
3274 	struct inet6_ifaddr *ifp = NULL;
3275 	struct hlist_node *n;
3276 	unsigned int hash = ipv6_addr_hash(addr);
3277 
3278 	rcu_read_lock_bh();
3279 	hlist_for_each_entry_rcu_bh(ifp, n, &inet6_addr_lst[hash], addr_lst) {
3280 		if (!net_eq(dev_net(ifp->idev->dev), net))
3281 			continue;
3282 		if (ipv6_addr_equal(&ifp->addr, addr) &&
3283 		    (ifp->flags & IFA_F_HOMEADDRESS)) {
3284 			ret = 1;
3285 			break;
3286 		}
3287 	}
3288 	rcu_read_unlock_bh();
3289 	return ret;
3290 }
3291 #endif
3292 
3293 /*
3294  *	Periodic address status verification
3295  */
3296 
addrconf_verify(unsigned long foo)3297 static void addrconf_verify(unsigned long foo)
3298 {
3299 	unsigned long now, next, next_sec, next_sched;
3300 	struct inet6_ifaddr *ifp;
3301 	struct hlist_node *node;
3302 	int i;
3303 
3304 	rcu_read_lock_bh();
3305 	spin_lock(&addrconf_verify_lock);
3306 	now = jiffies;
3307 	next = round_jiffies_up(now + ADDR_CHECK_FREQUENCY);
3308 
3309 	del_timer(&addr_chk_timer);
3310 
3311 	for (i = 0; i < IN6_ADDR_HSIZE; i++) {
3312 restart:
3313 		hlist_for_each_entry_rcu_bh(ifp, node,
3314 					 &inet6_addr_lst[i], addr_lst) {
3315 			unsigned long age;
3316 
3317 			if (ifp->flags & IFA_F_PERMANENT)
3318 				continue;
3319 
3320 			spin_lock(&ifp->lock);
3321 			/* We try to batch several events at once. */
3322 			age = (now - ifp->tstamp + ADDRCONF_TIMER_FUZZ_MINUS) / HZ;
3323 
3324 			if (ifp->valid_lft != INFINITY_LIFE_TIME &&
3325 			    age >= ifp->valid_lft) {
3326 				spin_unlock(&ifp->lock);
3327 				in6_ifa_hold(ifp);
3328 				ipv6_del_addr(ifp);
3329 				goto restart;
3330 			} else if (ifp->prefered_lft == INFINITY_LIFE_TIME) {
3331 				spin_unlock(&ifp->lock);
3332 				continue;
3333 			} else if (age >= ifp->prefered_lft) {
3334 				/* jiffies - ifp->tstamp > age >= ifp->prefered_lft */
3335 				int deprecate = 0;
3336 
3337 				if (!(ifp->flags&IFA_F_DEPRECATED)) {
3338 					deprecate = 1;
3339 					ifp->flags |= IFA_F_DEPRECATED;
3340 				}
3341 
3342 				if (time_before(ifp->tstamp + ifp->valid_lft * HZ, next))
3343 					next = ifp->tstamp + ifp->valid_lft * HZ;
3344 
3345 				spin_unlock(&ifp->lock);
3346 
3347 				if (deprecate) {
3348 					in6_ifa_hold(ifp);
3349 
3350 					ipv6_ifa_notify(0, ifp);
3351 					in6_ifa_put(ifp);
3352 					goto restart;
3353 				}
3354 #ifdef CONFIG_IPV6_PRIVACY
3355 			} else if ((ifp->flags&IFA_F_TEMPORARY) &&
3356 				   !(ifp->flags&IFA_F_TENTATIVE)) {
3357 				unsigned long regen_advance = ifp->idev->cnf.regen_max_retry *
3358 					ifp->idev->cnf.dad_transmits *
3359 					ifp->idev->nd_parms->retrans_time / HZ;
3360 
3361 				if (age >= ifp->prefered_lft - regen_advance) {
3362 					struct inet6_ifaddr *ifpub = ifp->ifpub;
3363 					if (time_before(ifp->tstamp + ifp->prefered_lft * HZ, next))
3364 						next = ifp->tstamp + ifp->prefered_lft * HZ;
3365 					if (!ifp->regen_count && ifpub) {
3366 						ifp->regen_count++;
3367 						in6_ifa_hold(ifp);
3368 						in6_ifa_hold(ifpub);
3369 						spin_unlock(&ifp->lock);
3370 
3371 						spin_lock(&ifpub->lock);
3372 						ifpub->regen_count = 0;
3373 						spin_unlock(&ifpub->lock);
3374 						ipv6_create_tempaddr(ifpub, ifp);
3375 						in6_ifa_put(ifpub);
3376 						in6_ifa_put(ifp);
3377 						goto restart;
3378 					}
3379 				} else if (time_before(ifp->tstamp + ifp->prefered_lft * HZ - regen_advance * HZ, next))
3380 					next = ifp->tstamp + ifp->prefered_lft * HZ - regen_advance * HZ;
3381 				spin_unlock(&ifp->lock);
3382 #endif
3383 			} else {
3384 				/* ifp->prefered_lft <= ifp->valid_lft */
3385 				if (time_before(ifp->tstamp + ifp->prefered_lft * HZ, next))
3386 					next = ifp->tstamp + ifp->prefered_lft * HZ;
3387 				spin_unlock(&ifp->lock);
3388 			}
3389 		}
3390 	}
3391 
3392 	next_sec = round_jiffies_up(next);
3393 	next_sched = next;
3394 
3395 	/* If rounded timeout is accurate enough, accept it. */
3396 	if (time_before(next_sec, next + ADDRCONF_TIMER_FUZZ))
3397 		next_sched = next_sec;
3398 
3399 	/* And minimum interval is ADDRCONF_TIMER_FUZZ_MAX. */
3400 	if (time_before(next_sched, jiffies + ADDRCONF_TIMER_FUZZ_MAX))
3401 		next_sched = jiffies + ADDRCONF_TIMER_FUZZ_MAX;
3402 
3403 	ADBG((KERN_DEBUG "now = %lu, schedule = %lu, rounded schedule = %lu => %lu\n",
3404 	      now, next, next_sec, next_sched));
3405 
3406 	addr_chk_timer.expires = next_sched;
3407 	add_timer(&addr_chk_timer);
3408 	spin_unlock(&addrconf_verify_lock);
3409 	rcu_read_unlock_bh();
3410 }
3411 
extract_addr(struct nlattr * addr,struct nlattr * local)3412 static struct in6_addr *extract_addr(struct nlattr *addr, struct nlattr *local)
3413 {
3414 	struct in6_addr *pfx = NULL;
3415 
3416 	if (addr)
3417 		pfx = nla_data(addr);
3418 
3419 	if (local) {
3420 		if (pfx && nla_memcmp(local, pfx, sizeof(*pfx)))
3421 			pfx = NULL;
3422 		else
3423 			pfx = nla_data(local);
3424 	}
3425 
3426 	return pfx;
3427 }
3428 
3429 static const struct nla_policy ifa_ipv6_policy[IFA_MAX+1] = {
3430 	[IFA_ADDRESS]		= { .len = sizeof(struct in6_addr) },
3431 	[IFA_LOCAL]		= { .len = sizeof(struct in6_addr) },
3432 	[IFA_CACHEINFO]		= { .len = sizeof(struct ifa_cacheinfo) },
3433 };
3434 
3435 static int
inet6_rtm_deladdr(struct sk_buff * skb,struct nlmsghdr * nlh,void * arg)3436 inet6_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
3437 {
3438 	struct net *net = sock_net(skb->sk);
3439 	struct ifaddrmsg *ifm;
3440 	struct nlattr *tb[IFA_MAX+1];
3441 	struct in6_addr *pfx;
3442 	int err;
3443 
3444 	err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv6_policy);
3445 	if (err < 0)
3446 		return err;
3447 
3448 	ifm = nlmsg_data(nlh);
3449 	pfx = extract_addr(tb[IFA_ADDRESS], tb[IFA_LOCAL]);
3450 	if (pfx == NULL)
3451 		return -EINVAL;
3452 
3453 	return inet6_addr_del(net, ifm->ifa_index, pfx, ifm->ifa_prefixlen);
3454 }
3455 
inet6_addr_modify(struct inet6_ifaddr * ifp,u8 ifa_flags,u32 prefered_lft,u32 valid_lft)3456 static int inet6_addr_modify(struct inet6_ifaddr *ifp, u8 ifa_flags,
3457 			     u32 prefered_lft, u32 valid_lft)
3458 {
3459 	u32 flags;
3460 	clock_t expires;
3461 	unsigned long timeout;
3462 
3463 	if (!valid_lft || (prefered_lft > valid_lft))
3464 		return -EINVAL;
3465 
3466 	timeout = addrconf_timeout_fixup(valid_lft, HZ);
3467 	if (addrconf_finite_timeout(timeout)) {
3468 		expires = jiffies_to_clock_t(timeout * HZ);
3469 		valid_lft = timeout;
3470 		flags = RTF_EXPIRES;
3471 	} else {
3472 		expires = 0;
3473 		flags = 0;
3474 		ifa_flags |= IFA_F_PERMANENT;
3475 	}
3476 
3477 	timeout = addrconf_timeout_fixup(prefered_lft, HZ);
3478 	if (addrconf_finite_timeout(timeout)) {
3479 		if (timeout == 0)
3480 			ifa_flags |= IFA_F_DEPRECATED;
3481 		prefered_lft = timeout;
3482 	}
3483 
3484 	spin_lock_bh(&ifp->lock);
3485 	ifp->flags = (ifp->flags & ~(IFA_F_DEPRECATED | IFA_F_PERMANENT | IFA_F_NODAD | IFA_F_HOMEADDRESS)) | ifa_flags;
3486 	ifp->tstamp = jiffies;
3487 	ifp->valid_lft = valid_lft;
3488 	ifp->prefered_lft = prefered_lft;
3489 
3490 	spin_unlock_bh(&ifp->lock);
3491 	if (!(ifp->flags&IFA_F_TENTATIVE))
3492 		ipv6_ifa_notify(0, ifp);
3493 
3494 	addrconf_prefix_route(&ifp->addr, ifp->prefix_len, ifp->idev->dev,
3495 			      expires, flags);
3496 	addrconf_verify(0);
3497 
3498 	return 0;
3499 }
3500 
3501 static int
inet6_rtm_newaddr(struct sk_buff * skb,struct nlmsghdr * nlh,void * arg)3502 inet6_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
3503 {
3504 	struct net *net = sock_net(skb->sk);
3505 	struct ifaddrmsg *ifm;
3506 	struct nlattr *tb[IFA_MAX+1];
3507 	struct in6_addr *pfx;
3508 	struct inet6_ifaddr *ifa;
3509 	struct net_device *dev;
3510 	u32 valid_lft = INFINITY_LIFE_TIME, preferred_lft = INFINITY_LIFE_TIME;
3511 	u8 ifa_flags;
3512 	int err;
3513 
3514 	err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv6_policy);
3515 	if (err < 0)
3516 		return err;
3517 
3518 	ifm = nlmsg_data(nlh);
3519 	pfx = extract_addr(tb[IFA_ADDRESS], tb[IFA_LOCAL]);
3520 	if (pfx == NULL)
3521 		return -EINVAL;
3522 
3523 	if (tb[IFA_CACHEINFO]) {
3524 		struct ifa_cacheinfo *ci;
3525 
3526 		ci = nla_data(tb[IFA_CACHEINFO]);
3527 		valid_lft = ci->ifa_valid;
3528 		preferred_lft = ci->ifa_prefered;
3529 	} else {
3530 		preferred_lft = INFINITY_LIFE_TIME;
3531 		valid_lft = INFINITY_LIFE_TIME;
3532 	}
3533 
3534 	dev =  __dev_get_by_index(net, ifm->ifa_index);
3535 	if (dev == NULL)
3536 		return -ENODEV;
3537 
3538 	/* We ignore other flags so far. */
3539 	ifa_flags = ifm->ifa_flags & (IFA_F_NODAD | IFA_F_HOMEADDRESS);
3540 
3541 	ifa = ipv6_get_ifaddr(net, pfx, dev, 1);
3542 	if (ifa == NULL) {
3543 		/*
3544 		 * It would be best to check for !NLM_F_CREATE here but
3545 		 * userspace alreay relies on not having to provide this.
3546 		 */
3547 		return inet6_addr_add(net, ifm->ifa_index, pfx,
3548 				      ifm->ifa_prefixlen, ifa_flags,
3549 				      preferred_lft, valid_lft);
3550 	}
3551 
3552 	if (nlh->nlmsg_flags & NLM_F_EXCL ||
3553 	    !(nlh->nlmsg_flags & NLM_F_REPLACE))
3554 		err = -EEXIST;
3555 	else
3556 		err = inet6_addr_modify(ifa, ifa_flags, preferred_lft, valid_lft);
3557 
3558 	in6_ifa_put(ifa);
3559 
3560 	return err;
3561 }
3562 
put_ifaddrmsg(struct nlmsghdr * nlh,u8 prefixlen,u8 flags,u8 scope,int ifindex)3563 static void put_ifaddrmsg(struct nlmsghdr *nlh, u8 prefixlen, u8 flags,
3564 			  u8 scope, int ifindex)
3565 {
3566 	struct ifaddrmsg *ifm;
3567 
3568 	ifm = nlmsg_data(nlh);
3569 	ifm->ifa_family = AF_INET6;
3570 	ifm->ifa_prefixlen = prefixlen;
3571 	ifm->ifa_flags = flags;
3572 	ifm->ifa_scope = scope;
3573 	ifm->ifa_index = ifindex;
3574 }
3575 
put_cacheinfo(struct sk_buff * skb,unsigned long cstamp,unsigned long tstamp,u32 preferred,u32 valid)3576 static int put_cacheinfo(struct sk_buff *skb, unsigned long cstamp,
3577 			 unsigned long tstamp, u32 preferred, u32 valid)
3578 {
3579 	struct ifa_cacheinfo ci;
3580 
3581 	ci.cstamp = cstamp_delta(cstamp);
3582 	ci.tstamp = cstamp_delta(tstamp);
3583 	ci.ifa_prefered = preferred;
3584 	ci.ifa_valid = valid;
3585 
3586 	return nla_put(skb, IFA_CACHEINFO, sizeof(ci), &ci);
3587 }
3588 
rt_scope(int ifa_scope)3589 static inline int rt_scope(int ifa_scope)
3590 {
3591 	if (ifa_scope & IFA_HOST)
3592 		return RT_SCOPE_HOST;
3593 	else if (ifa_scope & IFA_LINK)
3594 		return RT_SCOPE_LINK;
3595 	else if (ifa_scope & IFA_SITE)
3596 		return RT_SCOPE_SITE;
3597 	else
3598 		return RT_SCOPE_UNIVERSE;
3599 }
3600 
inet6_ifaddr_msgsize(void)3601 static inline int inet6_ifaddr_msgsize(void)
3602 {
3603 	return NLMSG_ALIGN(sizeof(struct ifaddrmsg))
3604 	       + nla_total_size(16) /* IFA_ADDRESS */
3605 	       + nla_total_size(sizeof(struct ifa_cacheinfo));
3606 }
3607 
inet6_fill_ifaddr(struct sk_buff * skb,struct inet6_ifaddr * ifa,u32 pid,u32 seq,int event,unsigned int flags)3608 static int inet6_fill_ifaddr(struct sk_buff *skb, struct inet6_ifaddr *ifa,
3609 			     u32 pid, u32 seq, int event, unsigned int flags)
3610 {
3611 	struct nlmsghdr  *nlh;
3612 	u32 preferred, valid;
3613 
3614 	nlh = nlmsg_put(skb, pid, seq, event, sizeof(struct ifaddrmsg), flags);
3615 	if (nlh == NULL)
3616 		return -EMSGSIZE;
3617 
3618 	put_ifaddrmsg(nlh, ifa->prefix_len, ifa->flags, rt_scope(ifa->scope),
3619 		      ifa->idev->dev->ifindex);
3620 
3621 	if (!(ifa->flags&IFA_F_PERMANENT)) {
3622 		preferred = ifa->prefered_lft;
3623 		valid = ifa->valid_lft;
3624 		if (preferred != INFINITY_LIFE_TIME) {
3625 			long tval = (jiffies - ifa->tstamp)/HZ;
3626 			if (preferred > tval)
3627 				preferred -= tval;
3628 			else
3629 				preferred = 0;
3630 			if (valid != INFINITY_LIFE_TIME) {
3631 				if (valid > tval)
3632 					valid -= tval;
3633 				else
3634 					valid = 0;
3635 			}
3636 		}
3637 	} else {
3638 		preferred = INFINITY_LIFE_TIME;
3639 		valid = INFINITY_LIFE_TIME;
3640 	}
3641 
3642 	if (nla_put(skb, IFA_ADDRESS, 16, &ifa->addr) < 0 ||
3643 	    put_cacheinfo(skb, ifa->cstamp, ifa->tstamp, preferred, valid) < 0) {
3644 		nlmsg_cancel(skb, nlh);
3645 		return -EMSGSIZE;
3646 	}
3647 
3648 	return nlmsg_end(skb, nlh);
3649 }
3650 
inet6_fill_ifmcaddr(struct sk_buff * skb,struct ifmcaddr6 * ifmca,u32 pid,u32 seq,int event,u16 flags)3651 static int inet6_fill_ifmcaddr(struct sk_buff *skb, struct ifmcaddr6 *ifmca,
3652 				u32 pid, u32 seq, int event, u16 flags)
3653 {
3654 	struct nlmsghdr  *nlh;
3655 	u8 scope = RT_SCOPE_UNIVERSE;
3656 	int ifindex = ifmca->idev->dev->ifindex;
3657 
3658 	if (ipv6_addr_scope(&ifmca->mca_addr) & IFA_SITE)
3659 		scope = RT_SCOPE_SITE;
3660 
3661 	nlh = nlmsg_put(skb, pid, seq, event, sizeof(struct ifaddrmsg), flags);
3662 	if (nlh == NULL)
3663 		return -EMSGSIZE;
3664 
3665 	put_ifaddrmsg(nlh, 128, IFA_F_PERMANENT, scope, ifindex);
3666 	if (nla_put(skb, IFA_MULTICAST, 16, &ifmca->mca_addr) < 0 ||
3667 	    put_cacheinfo(skb, ifmca->mca_cstamp, ifmca->mca_tstamp,
3668 			  INFINITY_LIFE_TIME, INFINITY_LIFE_TIME) < 0) {
3669 		nlmsg_cancel(skb, nlh);
3670 		return -EMSGSIZE;
3671 	}
3672 
3673 	return nlmsg_end(skb, nlh);
3674 }
3675 
inet6_fill_ifacaddr(struct sk_buff * skb,struct ifacaddr6 * ifaca,u32 pid,u32 seq,int event,unsigned int flags)3676 static int inet6_fill_ifacaddr(struct sk_buff *skb, struct ifacaddr6 *ifaca,
3677 				u32 pid, u32 seq, int event, unsigned int flags)
3678 {
3679 	struct nlmsghdr  *nlh;
3680 	u8 scope = RT_SCOPE_UNIVERSE;
3681 	int ifindex = ifaca->aca_idev->dev->ifindex;
3682 
3683 	if (ipv6_addr_scope(&ifaca->aca_addr) & IFA_SITE)
3684 		scope = RT_SCOPE_SITE;
3685 
3686 	nlh = nlmsg_put(skb, pid, seq, event, sizeof(struct ifaddrmsg), flags);
3687 	if (nlh == NULL)
3688 		return -EMSGSIZE;
3689 
3690 	put_ifaddrmsg(nlh, 128, IFA_F_PERMANENT, scope, ifindex);
3691 	if (nla_put(skb, IFA_ANYCAST, 16, &ifaca->aca_addr) < 0 ||
3692 	    put_cacheinfo(skb, ifaca->aca_cstamp, ifaca->aca_tstamp,
3693 			  INFINITY_LIFE_TIME, INFINITY_LIFE_TIME) < 0) {
3694 		nlmsg_cancel(skb, nlh);
3695 		return -EMSGSIZE;
3696 	}
3697 
3698 	return nlmsg_end(skb, nlh);
3699 }
3700 
3701 enum addr_type_t {
3702 	UNICAST_ADDR,
3703 	MULTICAST_ADDR,
3704 	ANYCAST_ADDR,
3705 };
3706 
3707 /* called with rcu_read_lock() */
in6_dump_addrs(struct inet6_dev * idev,struct sk_buff * skb,struct netlink_callback * cb,enum addr_type_t type,int s_ip_idx,int * p_ip_idx)3708 static int in6_dump_addrs(struct inet6_dev *idev, struct sk_buff *skb,
3709 			  struct netlink_callback *cb, enum addr_type_t type,
3710 			  int s_ip_idx, int *p_ip_idx)
3711 {
3712 	struct ifmcaddr6 *ifmca;
3713 	struct ifacaddr6 *ifaca;
3714 	int err = 1;
3715 	int ip_idx = *p_ip_idx;
3716 
3717 	read_lock_bh(&idev->lock);
3718 	switch (type) {
3719 	case UNICAST_ADDR: {
3720 		struct inet6_ifaddr *ifa;
3721 
3722 		/* unicast address incl. temp addr */
3723 		list_for_each_entry(ifa, &idev->addr_list, if_list) {
3724 			if (++ip_idx < s_ip_idx)
3725 				continue;
3726 			err = inet6_fill_ifaddr(skb, ifa,
3727 						NETLINK_CB(cb->skb).pid,
3728 						cb->nlh->nlmsg_seq,
3729 						RTM_NEWADDR,
3730 						NLM_F_MULTI);
3731 			if (err <= 0)
3732 				break;
3733 		}
3734 		break;
3735 	}
3736 	case MULTICAST_ADDR:
3737 		/* multicast address */
3738 		for (ifmca = idev->mc_list; ifmca;
3739 		     ifmca = ifmca->next, ip_idx++) {
3740 			if (ip_idx < s_ip_idx)
3741 				continue;
3742 			err = inet6_fill_ifmcaddr(skb, ifmca,
3743 						  NETLINK_CB(cb->skb).pid,
3744 						  cb->nlh->nlmsg_seq,
3745 						  RTM_GETMULTICAST,
3746 						  NLM_F_MULTI);
3747 			if (err <= 0)
3748 				break;
3749 		}
3750 		break;
3751 	case ANYCAST_ADDR:
3752 		/* anycast address */
3753 		for (ifaca = idev->ac_list; ifaca;
3754 		     ifaca = ifaca->aca_next, ip_idx++) {
3755 			if (ip_idx < s_ip_idx)
3756 				continue;
3757 			err = inet6_fill_ifacaddr(skb, ifaca,
3758 						  NETLINK_CB(cb->skb).pid,
3759 						  cb->nlh->nlmsg_seq,
3760 						  RTM_GETANYCAST,
3761 						  NLM_F_MULTI);
3762 			if (err <= 0)
3763 				break;
3764 		}
3765 		break;
3766 	default:
3767 		break;
3768 	}
3769 	read_unlock_bh(&idev->lock);
3770 	*p_ip_idx = ip_idx;
3771 	return err;
3772 }
3773 
inet6_dump_addr(struct sk_buff * skb,struct netlink_callback * cb,enum addr_type_t type)3774 static int inet6_dump_addr(struct sk_buff *skb, struct netlink_callback *cb,
3775 			   enum addr_type_t type)
3776 {
3777 	struct net *net = sock_net(skb->sk);
3778 	int h, s_h;
3779 	int idx, ip_idx;
3780 	int s_idx, s_ip_idx;
3781 	struct net_device *dev;
3782 	struct inet6_dev *idev;
3783 	struct hlist_head *head;
3784 	struct hlist_node *node;
3785 
3786 	s_h = cb->args[0];
3787 	s_idx = idx = cb->args[1];
3788 	s_ip_idx = ip_idx = cb->args[2];
3789 
3790 	rcu_read_lock();
3791 	for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
3792 		idx = 0;
3793 		head = &net->dev_index_head[h];
3794 		hlist_for_each_entry_rcu(dev, node, head, index_hlist) {
3795 			if (idx < s_idx)
3796 				goto cont;
3797 			if (h > s_h || idx > s_idx)
3798 				s_ip_idx = 0;
3799 			ip_idx = 0;
3800 			idev = __in6_dev_get(dev);
3801 			if (!idev)
3802 				goto cont;
3803 
3804 			if (in6_dump_addrs(idev, skb, cb, type,
3805 					   s_ip_idx, &ip_idx) <= 0)
3806 				goto done;
3807 cont:
3808 			idx++;
3809 		}
3810 	}
3811 done:
3812 	rcu_read_unlock();
3813 	cb->args[0] = h;
3814 	cb->args[1] = idx;
3815 	cb->args[2] = ip_idx;
3816 
3817 	return skb->len;
3818 }
3819 
inet6_dump_ifaddr(struct sk_buff * skb,struct netlink_callback * cb)3820 static int inet6_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb)
3821 {
3822 	enum addr_type_t type = UNICAST_ADDR;
3823 
3824 	return inet6_dump_addr(skb, cb, type);
3825 }
3826 
inet6_dump_ifmcaddr(struct sk_buff * skb,struct netlink_callback * cb)3827 static int inet6_dump_ifmcaddr(struct sk_buff *skb, struct netlink_callback *cb)
3828 {
3829 	enum addr_type_t type = MULTICAST_ADDR;
3830 
3831 	return inet6_dump_addr(skb, cb, type);
3832 }
3833 
3834 
inet6_dump_ifacaddr(struct sk_buff * skb,struct netlink_callback * cb)3835 static int inet6_dump_ifacaddr(struct sk_buff *skb, struct netlink_callback *cb)
3836 {
3837 	enum addr_type_t type = ANYCAST_ADDR;
3838 
3839 	return inet6_dump_addr(skb, cb, type);
3840 }
3841 
inet6_rtm_getaddr(struct sk_buff * in_skb,struct nlmsghdr * nlh,void * arg)3842 static int inet6_rtm_getaddr(struct sk_buff *in_skb, struct nlmsghdr* nlh,
3843 			     void *arg)
3844 {
3845 	struct net *net = sock_net(in_skb->sk);
3846 	struct ifaddrmsg *ifm;
3847 	struct nlattr *tb[IFA_MAX+1];
3848 	struct in6_addr *addr = NULL;
3849 	struct net_device *dev = NULL;
3850 	struct inet6_ifaddr *ifa;
3851 	struct sk_buff *skb;
3852 	int err;
3853 
3854 	err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv6_policy);
3855 	if (err < 0)
3856 		goto errout;
3857 
3858 	addr = extract_addr(tb[IFA_ADDRESS], tb[IFA_LOCAL]);
3859 	if (addr == NULL) {
3860 		err = -EINVAL;
3861 		goto errout;
3862 	}
3863 
3864 	ifm = nlmsg_data(nlh);
3865 	if (ifm->ifa_index)
3866 		dev = __dev_get_by_index(net, ifm->ifa_index);
3867 
3868 	ifa = ipv6_get_ifaddr(net, addr, dev, 1);
3869 	if (!ifa) {
3870 		err = -EADDRNOTAVAIL;
3871 		goto errout;
3872 	}
3873 
3874 	skb = nlmsg_new(inet6_ifaddr_msgsize(), GFP_KERNEL);
3875 	if (!skb) {
3876 		err = -ENOBUFS;
3877 		goto errout_ifa;
3878 	}
3879 
3880 	err = inet6_fill_ifaddr(skb, ifa, NETLINK_CB(in_skb).pid,
3881 				nlh->nlmsg_seq, RTM_NEWADDR, 0);
3882 	if (err < 0) {
3883 		/* -EMSGSIZE implies BUG in inet6_ifaddr_msgsize() */
3884 		WARN_ON(err == -EMSGSIZE);
3885 		kfree_skb(skb);
3886 		goto errout_ifa;
3887 	}
3888 	err = rtnl_unicast(skb, net, NETLINK_CB(in_skb).pid);
3889 errout_ifa:
3890 	in6_ifa_put(ifa);
3891 errout:
3892 	return err;
3893 }
3894 
inet6_ifa_notify(int event,struct inet6_ifaddr * ifa)3895 static void inet6_ifa_notify(int event, struct inet6_ifaddr *ifa)
3896 {
3897 	struct sk_buff *skb;
3898 	struct net *net = dev_net(ifa->idev->dev);
3899 	int err = -ENOBUFS;
3900 
3901 	skb = nlmsg_new(inet6_ifaddr_msgsize(), GFP_ATOMIC);
3902 	if (skb == NULL)
3903 		goto errout;
3904 
3905 	err = inet6_fill_ifaddr(skb, ifa, 0, 0, event, 0);
3906 	if (err < 0) {
3907 		/* -EMSGSIZE implies BUG in inet6_ifaddr_msgsize() */
3908 		WARN_ON(err == -EMSGSIZE);
3909 		kfree_skb(skb);
3910 		goto errout;
3911 	}
3912 	rtnl_notify(skb, net, 0, RTNLGRP_IPV6_IFADDR, NULL, GFP_ATOMIC);
3913 	return;
3914 errout:
3915 	if (err < 0)
3916 		rtnl_set_sk_err(net, RTNLGRP_IPV6_IFADDR, err);
3917 }
3918 
ipv6_store_devconf(struct ipv6_devconf * cnf,__s32 * array,int bytes)3919 static inline void ipv6_store_devconf(struct ipv6_devconf *cnf,
3920 				__s32 *array, int bytes)
3921 {
3922 	BUG_ON(bytes < (DEVCONF_MAX * 4));
3923 
3924 	memset(array, 0, bytes);
3925 	array[DEVCONF_FORWARDING] = cnf->forwarding;
3926 	array[DEVCONF_HOPLIMIT] = cnf->hop_limit;
3927 	array[DEVCONF_MTU6] = cnf->mtu6;
3928 	array[DEVCONF_ACCEPT_RA] = cnf->accept_ra;
3929 	array[DEVCONF_ACCEPT_REDIRECTS] = cnf->accept_redirects;
3930 	array[DEVCONF_AUTOCONF] = cnf->autoconf;
3931 	array[DEVCONF_DAD_TRANSMITS] = cnf->dad_transmits;
3932 	array[DEVCONF_RTR_SOLICITS] = cnf->rtr_solicits;
3933 	array[DEVCONF_RTR_SOLICIT_INTERVAL] =
3934 		jiffies_to_msecs(cnf->rtr_solicit_interval);
3935 	array[DEVCONF_RTR_SOLICIT_DELAY] =
3936 		jiffies_to_msecs(cnf->rtr_solicit_delay);
3937 	array[DEVCONF_FORCE_MLD_VERSION] = cnf->force_mld_version;
3938 #ifdef CONFIG_IPV6_PRIVACY
3939 	array[DEVCONF_USE_TEMPADDR] = cnf->use_tempaddr;
3940 	array[DEVCONF_TEMP_VALID_LFT] = cnf->temp_valid_lft;
3941 	array[DEVCONF_TEMP_PREFERED_LFT] = cnf->temp_prefered_lft;
3942 	array[DEVCONF_REGEN_MAX_RETRY] = cnf->regen_max_retry;
3943 	array[DEVCONF_MAX_DESYNC_FACTOR] = cnf->max_desync_factor;
3944 #endif
3945 	array[DEVCONF_MAX_ADDRESSES] = cnf->max_addresses;
3946 	array[DEVCONF_ACCEPT_RA_DEFRTR] = cnf->accept_ra_defrtr;
3947 	array[DEVCONF_ACCEPT_RA_PINFO] = cnf->accept_ra_pinfo;
3948 #ifdef CONFIG_IPV6_ROUTER_PREF
3949 	array[DEVCONF_ACCEPT_RA_RTR_PREF] = cnf->accept_ra_rtr_pref;
3950 	array[DEVCONF_RTR_PROBE_INTERVAL] =
3951 		jiffies_to_msecs(cnf->rtr_probe_interval);
3952 #ifdef CONFIG_IPV6_ROUTE_INFO
3953 	array[DEVCONF_ACCEPT_RA_RT_INFO_MAX_PLEN] = cnf->accept_ra_rt_info_max_plen;
3954 #endif
3955 #endif
3956 	array[DEVCONF_PROXY_NDP] = cnf->proxy_ndp;
3957 	array[DEVCONF_ACCEPT_SOURCE_ROUTE] = cnf->accept_source_route;
3958 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD
3959 	array[DEVCONF_OPTIMISTIC_DAD] = cnf->optimistic_dad;
3960 #endif
3961 #ifdef CONFIG_IPV6_MROUTE
3962 	array[DEVCONF_MC_FORWARDING] = cnf->mc_forwarding;
3963 #endif
3964 	array[DEVCONF_DISABLE_IPV6] = cnf->disable_ipv6;
3965 	array[DEVCONF_ACCEPT_DAD] = cnf->accept_dad;
3966 	array[DEVCONF_FORCE_TLLAO] = cnf->force_tllao;
3967 }
3968 
inet6_ifla6_size(void)3969 static inline size_t inet6_ifla6_size(void)
3970 {
3971 	return nla_total_size(4) /* IFLA_INET6_FLAGS */
3972 	     + nla_total_size(sizeof(struct ifla_cacheinfo))
3973 	     + nla_total_size(DEVCONF_MAX * 4) /* IFLA_INET6_CONF */
3974 	     + nla_total_size(IPSTATS_MIB_MAX * 8) /* IFLA_INET6_STATS */
3975 	     + nla_total_size(ICMP6_MIB_MAX * 8); /* IFLA_INET6_ICMP6STATS */
3976 }
3977 
inet6_if_nlmsg_size(void)3978 static inline size_t inet6_if_nlmsg_size(void)
3979 {
3980 	return NLMSG_ALIGN(sizeof(struct ifinfomsg))
3981 	       + nla_total_size(IFNAMSIZ) /* IFLA_IFNAME */
3982 	       + nla_total_size(MAX_ADDR_LEN) /* IFLA_ADDRESS */
3983 	       + nla_total_size(4) /* IFLA_MTU */
3984 	       + nla_total_size(4) /* IFLA_LINK */
3985 	       + nla_total_size(inet6_ifla6_size()); /* IFLA_PROTINFO */
3986 }
3987 
__snmp6_fill_statsdev(u64 * stats,atomic_long_t * mib,int items,int bytes)3988 static inline void __snmp6_fill_statsdev(u64 *stats, atomic_long_t *mib,
3989 				      int items, int bytes)
3990 {
3991 	int i;
3992 	int pad = bytes - sizeof(u64) * items;
3993 	BUG_ON(pad < 0);
3994 
3995 	/* Use put_unaligned() because stats may not be aligned for u64. */
3996 	put_unaligned(items, &stats[0]);
3997 	for (i = 1; i < items; i++)
3998 		put_unaligned(atomic_long_read(&mib[i]), &stats[i]);
3999 
4000 	memset(&stats[items], 0, pad);
4001 }
4002 
__snmp6_fill_stats64(u64 * stats,void __percpu ** mib,int items,int bytes,size_t syncpoff)4003 static inline void __snmp6_fill_stats64(u64 *stats, void __percpu **mib,
4004 				      int items, int bytes, size_t syncpoff)
4005 {
4006 	int i;
4007 	int pad = bytes - sizeof(u64) * items;
4008 	BUG_ON(pad < 0);
4009 
4010 	/* Use put_unaligned() because stats may not be aligned for u64. */
4011 	put_unaligned(items, &stats[0]);
4012 	for (i = 1; i < items; i++)
4013 		put_unaligned(snmp_fold_field64(mib, i, syncpoff), &stats[i]);
4014 
4015 	memset(&stats[items], 0, pad);
4016 }
4017 
snmp6_fill_stats(u64 * stats,struct inet6_dev * idev,int attrtype,int bytes)4018 static void snmp6_fill_stats(u64 *stats, struct inet6_dev *idev, int attrtype,
4019 			     int bytes)
4020 {
4021 	switch (attrtype) {
4022 	case IFLA_INET6_STATS:
4023 		__snmp6_fill_stats64(stats, (void __percpu **)idev->stats.ipv6,
4024 				     IPSTATS_MIB_MAX, bytes, offsetof(struct ipstats_mib, syncp));
4025 		break;
4026 	case IFLA_INET6_ICMP6STATS:
4027 		__snmp6_fill_statsdev(stats, idev->stats.icmpv6dev->mibs, ICMP6_MIB_MAX, bytes);
4028 		break;
4029 	}
4030 }
4031 
inet6_fill_ifla6_attrs(struct sk_buff * skb,struct inet6_dev * idev)4032 static int inet6_fill_ifla6_attrs(struct sk_buff *skb, struct inet6_dev *idev)
4033 {
4034 	struct nlattr *nla;
4035 	struct ifla_cacheinfo ci;
4036 
4037 	NLA_PUT_U32(skb, IFLA_INET6_FLAGS, idev->if_flags);
4038 
4039 	ci.max_reasm_len = IPV6_MAXPLEN;
4040 	ci.tstamp = cstamp_delta(idev->tstamp);
4041 	ci.reachable_time = jiffies_to_msecs(idev->nd_parms->reachable_time);
4042 	ci.retrans_time = jiffies_to_msecs(idev->nd_parms->retrans_time);
4043 	NLA_PUT(skb, IFLA_INET6_CACHEINFO, sizeof(ci), &ci);
4044 
4045 	nla = nla_reserve(skb, IFLA_INET6_CONF, DEVCONF_MAX * sizeof(s32));
4046 	if (nla == NULL)
4047 		goto nla_put_failure;
4048 	ipv6_store_devconf(&idev->cnf, nla_data(nla), nla_len(nla));
4049 
4050 	/* XXX - MC not implemented */
4051 
4052 	nla = nla_reserve(skb, IFLA_INET6_STATS, IPSTATS_MIB_MAX * sizeof(u64));
4053 	if (nla == NULL)
4054 		goto nla_put_failure;
4055 	snmp6_fill_stats(nla_data(nla), idev, IFLA_INET6_STATS, nla_len(nla));
4056 
4057 	nla = nla_reserve(skb, IFLA_INET6_ICMP6STATS, ICMP6_MIB_MAX * sizeof(u64));
4058 	if (nla == NULL)
4059 		goto nla_put_failure;
4060 	snmp6_fill_stats(nla_data(nla), idev, IFLA_INET6_ICMP6STATS, nla_len(nla));
4061 
4062 	return 0;
4063 
4064 nla_put_failure:
4065 	return -EMSGSIZE;
4066 }
4067 
inet6_get_link_af_size(const struct net_device * dev)4068 static size_t inet6_get_link_af_size(const struct net_device *dev)
4069 {
4070 	if (!__in6_dev_get(dev))
4071 		return 0;
4072 
4073 	return inet6_ifla6_size();
4074 }
4075 
inet6_fill_link_af(struct sk_buff * skb,const struct net_device * dev)4076 static int inet6_fill_link_af(struct sk_buff *skb, const struct net_device *dev)
4077 {
4078 	struct inet6_dev *idev = __in6_dev_get(dev);
4079 
4080 	if (!idev)
4081 		return -ENODATA;
4082 
4083 	if (inet6_fill_ifla6_attrs(skb, idev) < 0)
4084 		return -EMSGSIZE;
4085 
4086 	return 0;
4087 }
4088 
inet6_fill_ifinfo(struct sk_buff * skb,struct inet6_dev * idev,u32 pid,u32 seq,int event,unsigned int flags)4089 static int inet6_fill_ifinfo(struct sk_buff *skb, struct inet6_dev *idev,
4090 			     u32 pid, u32 seq, int event, unsigned int flags)
4091 {
4092 	struct net_device *dev = idev->dev;
4093 	struct ifinfomsg *hdr;
4094 	struct nlmsghdr *nlh;
4095 	void *protoinfo;
4096 
4097 	nlh = nlmsg_put(skb, pid, seq, event, sizeof(*hdr), flags);
4098 	if (nlh == NULL)
4099 		return -EMSGSIZE;
4100 
4101 	hdr = nlmsg_data(nlh);
4102 	hdr->ifi_family = AF_INET6;
4103 	hdr->__ifi_pad = 0;
4104 	hdr->ifi_type = dev->type;
4105 	hdr->ifi_index = dev->ifindex;
4106 	hdr->ifi_flags = dev_get_flags(dev);
4107 	hdr->ifi_change = 0;
4108 
4109 	NLA_PUT_STRING(skb, IFLA_IFNAME, dev->name);
4110 
4111 	if (dev->addr_len)
4112 		NLA_PUT(skb, IFLA_ADDRESS, dev->addr_len, dev->dev_addr);
4113 
4114 	NLA_PUT_U32(skb, IFLA_MTU, dev->mtu);
4115 	if (dev->ifindex != dev->iflink)
4116 		NLA_PUT_U32(skb, IFLA_LINK, dev->iflink);
4117 
4118 	protoinfo = nla_nest_start(skb, IFLA_PROTINFO);
4119 	if (protoinfo == NULL)
4120 		goto nla_put_failure;
4121 
4122 	if (inet6_fill_ifla6_attrs(skb, idev) < 0)
4123 		goto nla_put_failure;
4124 
4125 	nla_nest_end(skb, protoinfo);
4126 	return nlmsg_end(skb, nlh);
4127 
4128 nla_put_failure:
4129 	nlmsg_cancel(skb, nlh);
4130 	return -EMSGSIZE;
4131 }
4132 
inet6_dump_ifinfo(struct sk_buff * skb,struct netlink_callback * cb)4133 static int inet6_dump_ifinfo(struct sk_buff *skb, struct netlink_callback *cb)
4134 {
4135 	struct net *net = sock_net(skb->sk);
4136 	int h, s_h;
4137 	int idx = 0, s_idx;
4138 	struct net_device *dev;
4139 	struct inet6_dev *idev;
4140 	struct hlist_head *head;
4141 	struct hlist_node *node;
4142 
4143 	s_h = cb->args[0];
4144 	s_idx = cb->args[1];
4145 
4146 	rcu_read_lock();
4147 	for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
4148 		idx = 0;
4149 		head = &net->dev_index_head[h];
4150 		hlist_for_each_entry_rcu(dev, node, head, index_hlist) {
4151 			if (idx < s_idx)
4152 				goto cont;
4153 			idev = __in6_dev_get(dev);
4154 			if (!idev)
4155 				goto cont;
4156 			if (inet6_fill_ifinfo(skb, idev,
4157 					      NETLINK_CB(cb->skb).pid,
4158 					      cb->nlh->nlmsg_seq,
4159 					      RTM_NEWLINK, NLM_F_MULTI) <= 0)
4160 				goto out;
4161 cont:
4162 			idx++;
4163 		}
4164 	}
4165 out:
4166 	rcu_read_unlock();
4167 	cb->args[1] = idx;
4168 	cb->args[0] = h;
4169 
4170 	return skb->len;
4171 }
4172 
inet6_ifinfo_notify(int event,struct inet6_dev * idev)4173 void inet6_ifinfo_notify(int event, struct inet6_dev *idev)
4174 {
4175 	struct sk_buff *skb;
4176 	struct net *net = dev_net(idev->dev);
4177 	int err = -ENOBUFS;
4178 
4179 	skb = nlmsg_new(inet6_if_nlmsg_size(), GFP_ATOMIC);
4180 	if (skb == NULL)
4181 		goto errout;
4182 
4183 	err = inet6_fill_ifinfo(skb, idev, 0, 0, event, 0);
4184 	if (err < 0) {
4185 		/* -EMSGSIZE implies BUG in inet6_if_nlmsg_size() */
4186 		WARN_ON(err == -EMSGSIZE);
4187 		kfree_skb(skb);
4188 		goto errout;
4189 	}
4190 	rtnl_notify(skb, net, 0, RTNLGRP_IPV6_IFINFO, NULL, GFP_ATOMIC);
4191 	return;
4192 errout:
4193 	if (err < 0)
4194 		rtnl_set_sk_err(net, RTNLGRP_IPV6_IFINFO, err);
4195 }
4196 
inet6_prefix_nlmsg_size(void)4197 static inline size_t inet6_prefix_nlmsg_size(void)
4198 {
4199 	return NLMSG_ALIGN(sizeof(struct prefixmsg))
4200 	       + nla_total_size(sizeof(struct in6_addr))
4201 	       + nla_total_size(sizeof(struct prefix_cacheinfo));
4202 }
4203 
inet6_fill_prefix(struct sk_buff * skb,struct inet6_dev * idev,struct prefix_info * pinfo,u32 pid,u32 seq,int event,unsigned int flags)4204 static int inet6_fill_prefix(struct sk_buff *skb, struct inet6_dev *idev,
4205 			     struct prefix_info *pinfo, u32 pid, u32 seq,
4206 			     int event, unsigned int flags)
4207 {
4208 	struct prefixmsg *pmsg;
4209 	struct nlmsghdr *nlh;
4210 	struct prefix_cacheinfo	ci;
4211 
4212 	nlh = nlmsg_put(skb, pid, seq, event, sizeof(*pmsg), flags);
4213 	if (nlh == NULL)
4214 		return -EMSGSIZE;
4215 
4216 	pmsg = nlmsg_data(nlh);
4217 	pmsg->prefix_family = AF_INET6;
4218 	pmsg->prefix_pad1 = 0;
4219 	pmsg->prefix_pad2 = 0;
4220 	pmsg->prefix_ifindex = idev->dev->ifindex;
4221 	pmsg->prefix_len = pinfo->prefix_len;
4222 	pmsg->prefix_type = pinfo->type;
4223 	pmsg->prefix_pad3 = 0;
4224 	pmsg->prefix_flags = 0;
4225 	if (pinfo->onlink)
4226 		pmsg->prefix_flags |= IF_PREFIX_ONLINK;
4227 	if (pinfo->autoconf)
4228 		pmsg->prefix_flags |= IF_PREFIX_AUTOCONF;
4229 
4230 	NLA_PUT(skb, PREFIX_ADDRESS, sizeof(pinfo->prefix), &pinfo->prefix);
4231 
4232 	ci.preferred_time = ntohl(pinfo->prefered);
4233 	ci.valid_time = ntohl(pinfo->valid);
4234 	NLA_PUT(skb, PREFIX_CACHEINFO, sizeof(ci), &ci);
4235 
4236 	return nlmsg_end(skb, nlh);
4237 
4238 nla_put_failure:
4239 	nlmsg_cancel(skb, nlh);
4240 	return -EMSGSIZE;
4241 }
4242 
inet6_prefix_notify(int event,struct inet6_dev * idev,struct prefix_info * pinfo)4243 static void inet6_prefix_notify(int event, struct inet6_dev *idev,
4244 			 struct prefix_info *pinfo)
4245 {
4246 	struct sk_buff *skb;
4247 	struct net *net = dev_net(idev->dev);
4248 	int err = -ENOBUFS;
4249 
4250 	skb = nlmsg_new(inet6_prefix_nlmsg_size(), GFP_ATOMIC);
4251 	if (skb == NULL)
4252 		goto errout;
4253 
4254 	err = inet6_fill_prefix(skb, idev, pinfo, 0, 0, event, 0);
4255 	if (err < 0) {
4256 		/* -EMSGSIZE implies BUG in inet6_prefix_nlmsg_size() */
4257 		WARN_ON(err == -EMSGSIZE);
4258 		kfree_skb(skb);
4259 		goto errout;
4260 	}
4261 	rtnl_notify(skb, net, 0, RTNLGRP_IPV6_PREFIX, NULL, GFP_ATOMIC);
4262 	return;
4263 errout:
4264 	if (err < 0)
4265 		rtnl_set_sk_err(net, RTNLGRP_IPV6_PREFIX, err);
4266 }
4267 
__ipv6_ifa_notify(int event,struct inet6_ifaddr * ifp)4268 static void __ipv6_ifa_notify(int event, struct inet6_ifaddr *ifp)
4269 {
4270 	inet6_ifa_notify(event ? : RTM_NEWADDR, ifp);
4271 
4272 	switch (event) {
4273 	case RTM_NEWADDR:
4274 		/*
4275 		 * If the address was optimistic
4276 		 * we inserted the route at the start of
4277 		 * our DAD process, so we don't need
4278 		 * to do it again
4279 		 */
4280 		if (!(ifp->rt->rt6i_node))
4281 			ip6_ins_rt(ifp->rt);
4282 		if (ifp->idev->cnf.forwarding)
4283 			addrconf_join_anycast(ifp);
4284 		break;
4285 	case RTM_DELADDR:
4286 		if (ifp->idev->cnf.forwarding)
4287 			addrconf_leave_anycast(ifp);
4288 		addrconf_leave_solict(ifp->idev, &ifp->addr);
4289 		dst_hold(&ifp->rt->dst);
4290 
4291 		if (ip6_del_rt(ifp->rt))
4292 			dst_free(&ifp->rt->dst);
4293 		break;
4294 	}
4295 }
4296 
ipv6_ifa_notify(int event,struct inet6_ifaddr * ifp)4297 static void ipv6_ifa_notify(int event, struct inet6_ifaddr *ifp)
4298 {
4299 	rcu_read_lock_bh();
4300 	if (likely(ifp->idev->dead == 0))
4301 		__ipv6_ifa_notify(event, ifp);
4302 	rcu_read_unlock_bh();
4303 }
4304 
4305 #ifdef CONFIG_SYSCTL
4306 
4307 static
addrconf_sysctl_forward(ctl_table * ctl,int write,void __user * buffer,size_t * lenp,loff_t * ppos)4308 int addrconf_sysctl_forward(ctl_table *ctl, int write,
4309 			   void __user *buffer, size_t *lenp, loff_t *ppos)
4310 {
4311 	int *valp = ctl->data;
4312 	int val = *valp;
4313 	loff_t pos = *ppos;
4314 	ctl_table lctl;
4315 	int ret;
4316 
4317 	/*
4318 	 * ctl->data points to idev->cnf.forwarding, we should
4319 	 * not modify it until we get the rtnl lock.
4320 	 */
4321 	lctl = *ctl;
4322 	lctl.data = &val;
4323 
4324 	ret = proc_dointvec(&lctl, write, buffer, lenp, ppos);
4325 
4326 	if (write)
4327 		ret = addrconf_fixup_forwarding(ctl, valp, val);
4328 	if (ret)
4329 		*ppos = pos;
4330 	return ret;
4331 }
4332 
dev_disable_change(struct inet6_dev * idev)4333 static void dev_disable_change(struct inet6_dev *idev)
4334 {
4335 	if (!idev || !idev->dev)
4336 		return;
4337 
4338 	if (idev->cnf.disable_ipv6)
4339 		addrconf_notify(NULL, NETDEV_DOWN, idev->dev);
4340 	else
4341 		addrconf_notify(NULL, NETDEV_UP, idev->dev);
4342 }
4343 
addrconf_disable_change(struct net * net,__s32 newf)4344 static void addrconf_disable_change(struct net *net, __s32 newf)
4345 {
4346 	struct net_device *dev;
4347 	struct inet6_dev *idev;
4348 
4349 	rcu_read_lock();
4350 	for_each_netdev_rcu(net, dev) {
4351 		idev = __in6_dev_get(dev);
4352 		if (idev) {
4353 			int changed = (!idev->cnf.disable_ipv6) ^ (!newf);
4354 			idev->cnf.disable_ipv6 = newf;
4355 			if (changed)
4356 				dev_disable_change(idev);
4357 		}
4358 	}
4359 	rcu_read_unlock();
4360 }
4361 
addrconf_disable_ipv6(struct ctl_table * table,int * p,int newf)4362 static int addrconf_disable_ipv6(struct ctl_table *table, int *p, int newf)
4363 {
4364 	struct net *net;
4365 	int old;
4366 
4367 	if (!rtnl_trylock())
4368 		return restart_syscall();
4369 
4370 	net = (struct net *)table->extra2;
4371 	old = *p;
4372 	*p = newf;
4373 
4374 	if (p == &net->ipv6.devconf_dflt->disable_ipv6) {
4375 		rtnl_unlock();
4376 		return 0;
4377 	}
4378 
4379 	if (p == &net->ipv6.devconf_all->disable_ipv6) {
4380 		net->ipv6.devconf_dflt->disable_ipv6 = newf;
4381 		addrconf_disable_change(net, newf);
4382 	} else if ((!newf) ^ (!old))
4383 		dev_disable_change((struct inet6_dev *)table->extra1);
4384 
4385 	rtnl_unlock();
4386 	return 0;
4387 }
4388 
4389 static
addrconf_sysctl_disable(ctl_table * ctl,int write,void __user * buffer,size_t * lenp,loff_t * ppos)4390 int addrconf_sysctl_disable(ctl_table *ctl, int write,
4391 			    void __user *buffer, size_t *lenp, loff_t *ppos)
4392 {
4393 	int *valp = ctl->data;
4394 	int val = *valp;
4395 	loff_t pos = *ppos;
4396 	ctl_table lctl;
4397 	int ret;
4398 
4399 	/*
4400 	 * ctl->data points to idev->cnf.disable_ipv6, we should
4401 	 * not modify it until we get the rtnl lock.
4402 	 */
4403 	lctl = *ctl;
4404 	lctl.data = &val;
4405 
4406 	ret = proc_dointvec(&lctl, write, buffer, lenp, ppos);
4407 
4408 	if (write)
4409 		ret = addrconf_disable_ipv6(ctl, valp, val);
4410 	if (ret)
4411 		*ppos = pos;
4412 	return ret;
4413 }
4414 
4415 static struct addrconf_sysctl_table
4416 {
4417 	struct ctl_table_header *sysctl_header;
4418 	ctl_table addrconf_vars[DEVCONF_MAX+1];
4419 	char *dev_name;
4420 } addrconf_sysctl __read_mostly = {
4421 	.sysctl_header = NULL,
4422 	.addrconf_vars = {
4423 		{
4424 			.procname	= "forwarding",
4425 			.data		= &ipv6_devconf.forwarding,
4426 			.maxlen		= sizeof(int),
4427 			.mode		= 0644,
4428 			.proc_handler	= addrconf_sysctl_forward,
4429 		},
4430 		{
4431 			.procname	= "hop_limit",
4432 			.data		= &ipv6_devconf.hop_limit,
4433 			.maxlen		= sizeof(int),
4434 			.mode		= 0644,
4435 			.proc_handler	= proc_dointvec,
4436 		},
4437 		{
4438 			.procname	= "mtu",
4439 			.data		= &ipv6_devconf.mtu6,
4440 			.maxlen		= sizeof(int),
4441 			.mode		= 0644,
4442 			.proc_handler	= proc_dointvec,
4443 		},
4444 		{
4445 			.procname	= "accept_ra",
4446 			.data		= &ipv6_devconf.accept_ra,
4447 			.maxlen		= sizeof(int),
4448 			.mode		= 0644,
4449 			.proc_handler	= proc_dointvec,
4450 		},
4451 		{
4452 			.procname	= "accept_redirects",
4453 			.data		= &ipv6_devconf.accept_redirects,
4454 			.maxlen		= sizeof(int),
4455 			.mode		= 0644,
4456 			.proc_handler	= proc_dointvec,
4457 		},
4458 		{
4459 			.procname	= "autoconf",
4460 			.data		= &ipv6_devconf.autoconf,
4461 			.maxlen		= sizeof(int),
4462 			.mode		= 0644,
4463 			.proc_handler	= proc_dointvec,
4464 		},
4465 		{
4466 			.procname	= "dad_transmits",
4467 			.data		= &ipv6_devconf.dad_transmits,
4468 			.maxlen		= sizeof(int),
4469 			.mode		= 0644,
4470 			.proc_handler	= proc_dointvec,
4471 		},
4472 		{
4473 			.procname	= "router_solicitations",
4474 			.data		= &ipv6_devconf.rtr_solicits,
4475 			.maxlen		= sizeof(int),
4476 			.mode		= 0644,
4477 			.proc_handler	= proc_dointvec,
4478 		},
4479 		{
4480 			.procname	= "router_solicitation_interval",
4481 			.data		= &ipv6_devconf.rtr_solicit_interval,
4482 			.maxlen		= sizeof(int),
4483 			.mode		= 0644,
4484 			.proc_handler	= proc_dointvec_jiffies,
4485 		},
4486 		{
4487 			.procname	= "router_solicitation_delay",
4488 			.data		= &ipv6_devconf.rtr_solicit_delay,
4489 			.maxlen		= sizeof(int),
4490 			.mode		= 0644,
4491 			.proc_handler	= proc_dointvec_jiffies,
4492 		},
4493 		{
4494 			.procname	= "force_mld_version",
4495 			.data		= &ipv6_devconf.force_mld_version,
4496 			.maxlen		= sizeof(int),
4497 			.mode		= 0644,
4498 			.proc_handler	= proc_dointvec,
4499 		},
4500 #ifdef CONFIG_IPV6_PRIVACY
4501 		{
4502 			.procname	= "use_tempaddr",
4503 			.data		= &ipv6_devconf.use_tempaddr,
4504 			.maxlen		= sizeof(int),
4505 			.mode		= 0644,
4506 			.proc_handler	= proc_dointvec,
4507 		},
4508 		{
4509 			.procname	= "temp_valid_lft",
4510 			.data		= &ipv6_devconf.temp_valid_lft,
4511 			.maxlen		= sizeof(int),
4512 			.mode		= 0644,
4513 			.proc_handler	= proc_dointvec,
4514 		},
4515 		{
4516 			.procname	= "temp_prefered_lft",
4517 			.data		= &ipv6_devconf.temp_prefered_lft,
4518 			.maxlen		= sizeof(int),
4519 			.mode		= 0644,
4520 			.proc_handler	= proc_dointvec,
4521 		},
4522 		{
4523 			.procname	= "regen_max_retry",
4524 			.data		= &ipv6_devconf.regen_max_retry,
4525 			.maxlen		= sizeof(int),
4526 			.mode		= 0644,
4527 			.proc_handler	= proc_dointvec,
4528 		},
4529 		{
4530 			.procname	= "max_desync_factor",
4531 			.data		= &ipv6_devconf.max_desync_factor,
4532 			.maxlen		= sizeof(int),
4533 			.mode		= 0644,
4534 			.proc_handler	= proc_dointvec,
4535 		},
4536 #endif
4537 		{
4538 			.procname	= "max_addresses",
4539 			.data		= &ipv6_devconf.max_addresses,
4540 			.maxlen		= sizeof(int),
4541 			.mode		= 0644,
4542 			.proc_handler	= proc_dointvec,
4543 		},
4544 		{
4545 			.procname	= "accept_ra_defrtr",
4546 			.data		= &ipv6_devconf.accept_ra_defrtr,
4547 			.maxlen		= sizeof(int),
4548 			.mode		= 0644,
4549 			.proc_handler	= proc_dointvec,
4550 		},
4551 		{
4552 			.procname	= "accept_ra_pinfo",
4553 			.data		= &ipv6_devconf.accept_ra_pinfo,
4554 			.maxlen		= sizeof(int),
4555 			.mode		= 0644,
4556 			.proc_handler	= proc_dointvec,
4557 		},
4558 #ifdef CONFIG_IPV6_ROUTER_PREF
4559 		{
4560 			.procname	= "accept_ra_rtr_pref",
4561 			.data		= &ipv6_devconf.accept_ra_rtr_pref,
4562 			.maxlen		= sizeof(int),
4563 			.mode		= 0644,
4564 			.proc_handler	= proc_dointvec,
4565 		},
4566 		{
4567 			.procname	= "router_probe_interval",
4568 			.data		= &ipv6_devconf.rtr_probe_interval,
4569 			.maxlen		= sizeof(int),
4570 			.mode		= 0644,
4571 			.proc_handler	= proc_dointvec_jiffies,
4572 		},
4573 #ifdef CONFIG_IPV6_ROUTE_INFO
4574 		{
4575 			.procname	= "accept_ra_rt_info_max_plen",
4576 			.data		= &ipv6_devconf.accept_ra_rt_info_max_plen,
4577 			.maxlen		= sizeof(int),
4578 			.mode		= 0644,
4579 			.proc_handler	= proc_dointvec,
4580 		},
4581 #endif
4582 #endif
4583 		{
4584 			.procname	= "proxy_ndp",
4585 			.data		= &ipv6_devconf.proxy_ndp,
4586 			.maxlen		= sizeof(int),
4587 			.mode		= 0644,
4588 			.proc_handler	= proc_dointvec,
4589 		},
4590 		{
4591 			.procname	= "accept_source_route",
4592 			.data		= &ipv6_devconf.accept_source_route,
4593 			.maxlen		= sizeof(int),
4594 			.mode		= 0644,
4595 			.proc_handler	= proc_dointvec,
4596 		},
4597 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD
4598 		{
4599 			.procname       = "optimistic_dad",
4600 			.data           = &ipv6_devconf.optimistic_dad,
4601 			.maxlen         = sizeof(int),
4602 			.mode           = 0644,
4603 			.proc_handler   = proc_dointvec,
4604 
4605 		},
4606 #endif
4607 #ifdef CONFIG_IPV6_MROUTE
4608 		{
4609 			.procname	= "mc_forwarding",
4610 			.data		= &ipv6_devconf.mc_forwarding,
4611 			.maxlen		= sizeof(int),
4612 			.mode		= 0444,
4613 			.proc_handler	= proc_dointvec,
4614 		},
4615 #endif
4616 		{
4617 			.procname	= "disable_ipv6",
4618 			.data		= &ipv6_devconf.disable_ipv6,
4619 			.maxlen		= sizeof(int),
4620 			.mode		= 0644,
4621 			.proc_handler	= addrconf_sysctl_disable,
4622 		},
4623 		{
4624 			.procname	= "accept_dad",
4625 			.data		= &ipv6_devconf.accept_dad,
4626 			.maxlen		= sizeof(int),
4627 			.mode		= 0644,
4628 			.proc_handler	= proc_dointvec,
4629 		},
4630 		{
4631 			.procname       = "force_tllao",
4632 			.data           = &ipv6_devconf.force_tllao,
4633 			.maxlen         = sizeof(int),
4634 			.mode           = 0644,
4635 			.proc_handler   = proc_dointvec
4636 		},
4637 		{
4638 			/* sentinel */
4639 		}
4640 	},
4641 };
4642 
__addrconf_sysctl_register(struct net * net,char * dev_name,struct inet6_dev * idev,struct ipv6_devconf * p)4643 static int __addrconf_sysctl_register(struct net *net, char *dev_name,
4644 		struct inet6_dev *idev, struct ipv6_devconf *p)
4645 {
4646 	int i;
4647 	struct addrconf_sysctl_table *t;
4648 
4649 #define ADDRCONF_CTL_PATH_DEV	3
4650 
4651 	struct ctl_path addrconf_ctl_path[] = {
4652 		{ .procname = "net", },
4653 		{ .procname = "ipv6", },
4654 		{ .procname = "conf", },
4655 		{ /* to be set */ },
4656 		{ },
4657 	};
4658 
4659 
4660 	t = kmemdup(&addrconf_sysctl, sizeof(*t), GFP_KERNEL);
4661 	if (t == NULL)
4662 		goto out;
4663 
4664 	for (i = 0; t->addrconf_vars[i].data; i++) {
4665 		t->addrconf_vars[i].data += (char *)p - (char *)&ipv6_devconf;
4666 		t->addrconf_vars[i].extra1 = idev; /* embedded; no ref */
4667 		t->addrconf_vars[i].extra2 = net;
4668 	}
4669 
4670 	/*
4671 	 * Make a copy of dev_name, because '.procname' is regarded as const
4672 	 * by sysctl and we wouldn't want anyone to change it under our feet
4673 	 * (see SIOCSIFNAME).
4674 	 */
4675 	t->dev_name = kstrdup(dev_name, GFP_KERNEL);
4676 	if (!t->dev_name)
4677 		goto free;
4678 
4679 	addrconf_ctl_path[ADDRCONF_CTL_PATH_DEV].procname = t->dev_name;
4680 
4681 	t->sysctl_header = register_net_sysctl_table(net, addrconf_ctl_path,
4682 			t->addrconf_vars);
4683 	if (t->sysctl_header == NULL)
4684 		goto free_procname;
4685 
4686 	p->sysctl = t;
4687 	return 0;
4688 
4689 free_procname:
4690 	kfree(t->dev_name);
4691 free:
4692 	kfree(t);
4693 out:
4694 	return -ENOBUFS;
4695 }
4696 
__addrconf_sysctl_unregister(struct ipv6_devconf * p)4697 static void __addrconf_sysctl_unregister(struct ipv6_devconf *p)
4698 {
4699 	struct addrconf_sysctl_table *t;
4700 
4701 	if (p->sysctl == NULL)
4702 		return;
4703 
4704 	t = p->sysctl;
4705 	p->sysctl = NULL;
4706 	unregister_net_sysctl_table(t->sysctl_header);
4707 	kfree(t->dev_name);
4708 	kfree(t);
4709 }
4710 
addrconf_sysctl_register(struct inet6_dev * idev)4711 static void addrconf_sysctl_register(struct inet6_dev *idev)
4712 {
4713 	neigh_sysctl_register(idev->dev, idev->nd_parms, "ipv6",
4714 			      &ndisc_ifinfo_sysctl_change);
4715 	__addrconf_sysctl_register(dev_net(idev->dev), idev->dev->name,
4716 					idev, &idev->cnf);
4717 }
4718 
addrconf_sysctl_unregister(struct inet6_dev * idev)4719 static void addrconf_sysctl_unregister(struct inet6_dev *idev)
4720 {
4721 	__addrconf_sysctl_unregister(&idev->cnf);
4722 	neigh_sysctl_unregister(idev->nd_parms);
4723 }
4724 
4725 
4726 #endif
4727 
addrconf_init_net(struct net * net)4728 static int __net_init addrconf_init_net(struct net *net)
4729 {
4730 	int err = -ENOMEM;
4731 	struct ipv6_devconf *all, *dflt;
4732 
4733 	all = kmemdup(&ipv6_devconf, sizeof(ipv6_devconf), GFP_KERNEL);
4734 	if (all == NULL)
4735 		goto err_alloc_all;
4736 
4737 	dflt = kmemdup(&ipv6_devconf_dflt, sizeof(ipv6_devconf_dflt), GFP_KERNEL);
4738 	if (dflt == NULL)
4739 		goto err_alloc_dflt;
4740 
4741 	/* these will be inherited by all namespaces */
4742 	dflt->autoconf = ipv6_defaults.autoconf;
4743 	dflt->disable_ipv6 = ipv6_defaults.disable_ipv6;
4744 
4745 	net->ipv6.devconf_all = all;
4746 	net->ipv6.devconf_dflt = dflt;
4747 
4748 #ifdef CONFIG_SYSCTL
4749 	err = __addrconf_sysctl_register(net, "all", NULL, all);
4750 	if (err < 0)
4751 		goto err_reg_all;
4752 
4753 	err = __addrconf_sysctl_register(net, "default", NULL, dflt);
4754 	if (err < 0)
4755 		goto err_reg_dflt;
4756 #endif
4757 	return 0;
4758 
4759 #ifdef CONFIG_SYSCTL
4760 err_reg_dflt:
4761 	__addrconf_sysctl_unregister(all);
4762 err_reg_all:
4763 	kfree(dflt);
4764 #endif
4765 err_alloc_dflt:
4766 	kfree(all);
4767 err_alloc_all:
4768 	return err;
4769 }
4770 
addrconf_exit_net(struct net * net)4771 static void __net_exit addrconf_exit_net(struct net *net)
4772 {
4773 #ifdef CONFIG_SYSCTL
4774 	__addrconf_sysctl_unregister(net->ipv6.devconf_dflt);
4775 	__addrconf_sysctl_unregister(net->ipv6.devconf_all);
4776 #endif
4777 	if (!net_eq(net, &init_net)) {
4778 		kfree(net->ipv6.devconf_dflt);
4779 		kfree(net->ipv6.devconf_all);
4780 	}
4781 }
4782 
4783 static struct pernet_operations addrconf_ops = {
4784 	.init = addrconf_init_net,
4785 	.exit = addrconf_exit_net,
4786 };
4787 
4788 /*
4789  *      Device notifier
4790  */
4791 
register_inet6addr_notifier(struct notifier_block * nb)4792 int register_inet6addr_notifier(struct notifier_block *nb)
4793 {
4794 	return atomic_notifier_chain_register(&inet6addr_chain, nb);
4795 }
4796 EXPORT_SYMBOL(register_inet6addr_notifier);
4797 
unregister_inet6addr_notifier(struct notifier_block * nb)4798 int unregister_inet6addr_notifier(struct notifier_block *nb)
4799 {
4800 	return atomic_notifier_chain_unregister(&inet6addr_chain, nb);
4801 }
4802 EXPORT_SYMBOL(unregister_inet6addr_notifier);
4803 
4804 static struct rtnl_af_ops inet6_ops = {
4805 	.family		  = AF_INET6,
4806 	.fill_link_af	  = inet6_fill_link_af,
4807 	.get_link_af_size = inet6_get_link_af_size,
4808 };
4809 
4810 /*
4811  *	Init / cleanup code
4812  */
4813 
addrconf_init(void)4814 int __init addrconf_init(void)
4815 {
4816 	int i, err;
4817 
4818 	err = ipv6_addr_label_init();
4819 	if (err < 0) {
4820 		printk(KERN_CRIT "IPv6 Addrconf:"
4821 		       " cannot initialize default policy table: %d.\n", err);
4822 		goto out;
4823 	}
4824 
4825 	err = register_pernet_subsys(&addrconf_ops);
4826 	if (err < 0)
4827 		goto out_addrlabel;
4828 
4829 	/* The addrconf netdev notifier requires that loopback_dev
4830 	 * has it's ipv6 private information allocated and setup
4831 	 * before it can bring up and give link-local addresses
4832 	 * to other devices which are up.
4833 	 *
4834 	 * Unfortunately, loopback_dev is not necessarily the first
4835 	 * entry in the global dev_base list of net devices.  In fact,
4836 	 * it is likely to be the very last entry on that list.
4837 	 * So this causes the notifier registry below to try and
4838 	 * give link-local addresses to all devices besides loopback_dev
4839 	 * first, then loopback_dev, which cases all the non-loopback_dev
4840 	 * devices to fail to get a link-local address.
4841 	 *
4842 	 * So, as a temporary fix, allocate the ipv6 structure for
4843 	 * loopback_dev first by hand.
4844 	 * Longer term, all of the dependencies ipv6 has upon the loopback
4845 	 * device and it being up should be removed.
4846 	 */
4847 	rtnl_lock();
4848 	if (!ipv6_add_dev(init_net.loopback_dev))
4849 		err = -ENOMEM;
4850 	rtnl_unlock();
4851 	if (err)
4852 		goto errlo;
4853 
4854 	for (i = 0; i < IN6_ADDR_HSIZE; i++)
4855 		INIT_HLIST_HEAD(&inet6_addr_lst[i]);
4856 
4857 	register_netdevice_notifier(&ipv6_dev_notf);
4858 
4859 	addrconf_verify(0);
4860 
4861 	err = rtnl_af_register(&inet6_ops);
4862 	if (err < 0)
4863 		goto errout_af;
4864 
4865 	err = __rtnl_register(PF_INET6, RTM_GETLINK, NULL, inet6_dump_ifinfo,
4866 			      NULL);
4867 	if (err < 0)
4868 		goto errout;
4869 
4870 	/* Only the first call to __rtnl_register can fail */
4871 	__rtnl_register(PF_INET6, RTM_NEWADDR, inet6_rtm_newaddr, NULL, NULL);
4872 	__rtnl_register(PF_INET6, RTM_DELADDR, inet6_rtm_deladdr, NULL, NULL);
4873 	__rtnl_register(PF_INET6, RTM_GETADDR, inet6_rtm_getaddr,
4874 			inet6_dump_ifaddr, NULL);
4875 	__rtnl_register(PF_INET6, RTM_GETMULTICAST, NULL,
4876 			inet6_dump_ifmcaddr, NULL);
4877 	__rtnl_register(PF_INET6, RTM_GETANYCAST, NULL,
4878 			inet6_dump_ifacaddr, NULL);
4879 
4880 	ipv6_addr_label_rtnl_register();
4881 
4882 	return 0;
4883 errout:
4884 	rtnl_af_unregister(&inet6_ops);
4885 errout_af:
4886 	unregister_netdevice_notifier(&ipv6_dev_notf);
4887 errlo:
4888 	unregister_pernet_subsys(&addrconf_ops);
4889 out_addrlabel:
4890 	ipv6_addr_label_cleanup();
4891 out:
4892 	return err;
4893 }
4894 
addrconf_cleanup(void)4895 void addrconf_cleanup(void)
4896 {
4897 	struct net_device *dev;
4898 	int i;
4899 
4900 	unregister_netdevice_notifier(&ipv6_dev_notf);
4901 	unregister_pernet_subsys(&addrconf_ops);
4902 	ipv6_addr_label_cleanup();
4903 
4904 	rtnl_lock();
4905 
4906 	__rtnl_af_unregister(&inet6_ops);
4907 
4908 	/* clean dev list */
4909 	for_each_netdev(&init_net, dev) {
4910 		if (__in6_dev_get(dev) == NULL)
4911 			continue;
4912 		addrconf_ifdown(dev, 1);
4913 	}
4914 	addrconf_ifdown(init_net.loopback_dev, 2);
4915 
4916 	/*
4917 	 *	Check hash table.
4918 	 */
4919 	spin_lock_bh(&addrconf_hash_lock);
4920 	for (i = 0; i < IN6_ADDR_HSIZE; i++)
4921 		WARN_ON(!hlist_empty(&inet6_addr_lst[i]));
4922 	spin_unlock_bh(&addrconf_hash_lock);
4923 
4924 	del_timer(&addr_chk_timer);
4925 	rtnl_unlock();
4926 }
4927