2 * NET3 IP device support routines.
4 * Version: $Id: devinet.c,v 1.44 2001/10/31 21:55:54 davem Exp $
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
11 * Derived from the IP parts of dev.c 1.0.19
13 * Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
14 * Mark Evans, <evansmp@uhura.aston.ac.uk>
17 * Alan Cox, <gw4pts@gw4pts.ampr.org>
18 * Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
21 * Alexey Kuznetsov: pa_* fields are replaced with ifaddr
23 * Cyrus Durgin: updated for kmod
24 * Matthias Andree: in devinet_ioctl, compare label and
25 * address (4.4BSD alias style support),
26 * fall back to comparing just the label
31 #include <asm/uaccess.h>
32 #include <asm/system.h>
33 #include <linux/bitops.h>
34 #include <linux/capability.h>
35 #include <linux/module.h>
36 #include <linux/types.h>
37 #include <linux/kernel.h>
38 #include <linux/string.h>
40 #include <linux/socket.h>
41 #include <linux/sockios.h>
43 #include <linux/errno.h>
44 #include <linux/interrupt.h>
45 #include <linux/if_addr.h>
46 #include <linux/if_ether.h>
47 #include <linux/inet.h>
48 #include <linux/netdevice.h>
49 #include <linux/etherdevice.h>
50 #include <linux/skbuff.h>
51 #include <linux/init.h>
52 #include <linux/notifier.h>
53 #include <linux/inetdevice.h>
54 #include <linux/igmp.h>
56 #include <linux/sysctl.h>
58 #include <linux/kmod.h>
62 #include <net/route.h>
63 #include <net/ip_fib.h>
64 #include <net/rtnetlink.h>
66 struct ipv4_devconf ipv4_devconf = {
68 [NET_IPV4_CONF_ACCEPT_REDIRECTS - 1] = 1,
69 [NET_IPV4_CONF_SEND_REDIRECTS - 1] = 1,
70 [NET_IPV4_CONF_SECURE_REDIRECTS - 1] = 1,
71 [NET_IPV4_CONF_SHARED_MEDIA - 1] = 1,
75 static struct ipv4_devconf ipv4_devconf_dflt = {
77 [NET_IPV4_CONF_ACCEPT_REDIRECTS - 1] = 1,
78 [NET_IPV4_CONF_SEND_REDIRECTS - 1] = 1,
79 [NET_IPV4_CONF_SECURE_REDIRECTS - 1] = 1,
80 [NET_IPV4_CONF_SHARED_MEDIA - 1] = 1,
81 [NET_IPV4_CONF_ACCEPT_SOURCE_ROUTE - 1] = 1,
/* Shorthand: IPV4_DEVCONF() applied to the file-local ipv4_devconf_dflt table. */
85 #define IPV4_DEVCONF_DFLT(attr) IPV4_DEVCONF(ipv4_devconf_dflt, attr)
/*
 * Netlink attribute policy for IPv4 address messages, indexed by IFA_*
 * attribute type. It is the policy handed to nlmsg_parse() by
 * inet_rtm_deladdr() and rtm_to_ifaddr() in this file.
 *
 * The four address-valued attributes are declared NLA_U32; IFA_LABEL is a
 * string whose .len is IFNAMSIZ - 1.
 */
87 static const struct nla_policy ifa_ipv4_policy[IFA_MAX+1] = {
88 [IFA_LOCAL] = { .type = NLA_U32 },
89 [IFA_ADDRESS] = { .type = NLA_U32 },
90 [IFA_BROADCAST] = { .type = NLA_U32 },
91 [IFA_ANYCAST] = { .type = NLA_U32 },
92 [IFA_LABEL] = { .type = NLA_STRING, .len = IFNAMSIZ - 1 },
95 static void rtmsg_ifa(int event, struct in_ifaddr *, struct nlmsghdr *, u32);
97 static BLOCKING_NOTIFIER_HEAD(inetaddr_chain);
98 static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
101 static void devinet_sysctl_register(struct in_device *in_dev,
102 struct ipv4_devconf *p);
103 static void devinet_sysctl_unregister(struct ipv4_devconf *p);
106 /* Locks all the inet devices. */
108 static struct in_ifaddr *inet_alloc_ifa(void)
110 struct in_ifaddr *ifa = kzalloc(sizeof(*ifa), GFP_KERNEL);
113 INIT_RCU_HEAD(&ifa->rcu_head);
119 static void inet_rcu_free_ifa(struct rcu_head *head)
121 struct in_ifaddr *ifa = container_of(head, struct in_ifaddr, rcu_head);
123 in_dev_put(ifa->ifa_dev);
/*
 * Release an in_ifaddr through RCU: the address is not torn down here but
 * queued with call_rcu(), with inet_rcu_free_ifa() as the callback that
 * receives ifa->rcu_head.
 */
127 static inline void inet_free_ifa(struct in_ifaddr *ifa)
129 call_rcu(&ifa->rcu_head, inet_rcu_free_ifa);
132 void in_dev_finish_destroy(struct in_device *idev)
134 struct net_device *dev = idev->dev;
136 BUG_TRAP(!idev->ifa_list);
137 BUG_TRAP(!idev->mc_list);
138 #ifdef NET_REFCNT_DEBUG
139 printk(KERN_DEBUG "in_dev_finish_destroy: %p=%s\n",
140 idev, dev ? dev->name : "NIL");
144 printk("Freeing alive in_device %p\n", idev);
150 static struct in_device *inetdev_init(struct net_device *dev)
152 struct in_device *in_dev;
156 in_dev = kzalloc(sizeof(*in_dev), GFP_KERNEL);
159 INIT_RCU_HEAD(&in_dev->rcu_head);
160 memcpy(&in_dev->cnf, &ipv4_devconf_dflt, sizeof(in_dev->cnf));
161 in_dev->cnf.sysctl = NULL;
163 if ((in_dev->arp_parms = neigh_parms_alloc(dev, &arp_tbl)) == NULL)
165 /* Reference in_dev->dev */
168 neigh_sysctl_register(dev, in_dev->arp_parms, NET_IPV4,
169 NET_IPV4_NEIGH, "ipv4", NULL, NULL);
172 /* Account for reference dev->ip_ptr (below) */
176 devinet_sysctl_register(in_dev, &in_dev->cnf);
178 ip_mc_init_dev(in_dev);
179 if (dev->flags & IFF_UP)
182 /* we can receive as soon as ip_ptr is set -- do this last */
183 rcu_assign_pointer(dev->ip_ptr, in_dev);
192 static void in_dev_rcu_put(struct rcu_head *head)
194 struct in_device *idev = container_of(head, struct in_device, rcu_head);
198 static void inetdev_destroy(struct in_device *in_dev)
200 struct in_ifaddr *ifa;
201 struct net_device *dev;
209 ip_mc_destroy_dev(in_dev);
211 while ((ifa = in_dev->ifa_list) != NULL) {
212 inet_del_ifa(in_dev, &in_dev->ifa_list, 0);
217 devinet_sysctl_unregister(&in_dev->cnf);
223 neigh_sysctl_unregister(in_dev->arp_parms);
225 neigh_parms_release(&arp_tbl, in_dev->arp_parms);
228 call_rcu(&in_dev->rcu_head, in_dev_rcu_put);
231 int inet_addr_onlink(struct in_device *in_dev, __be32 a, __be32 b)
234 for_primary_ifa(in_dev) {
235 if (inet_ifa_match(a, ifa)) {
236 if (!b || inet_ifa_match(b, ifa)) {
241 } endfor_ifa(in_dev);
246 static void __inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
247 int destroy, struct nlmsghdr *nlh, u32 pid)
249 struct in_ifaddr *promote = NULL;
250 struct in_ifaddr *ifa, *ifa1 = *ifap;
251 struct in_ifaddr *last_prim = in_dev->ifa_list;
252 struct in_ifaddr *prev_prom = NULL;
253 int do_promote = IN_DEV_PROMOTE_SECONDARIES(in_dev);
257 /* 1. Deleting primary ifaddr forces deletion of all secondaries
258 * unless alias promotion is set
261 if (!(ifa1->ifa_flags & IFA_F_SECONDARY)) {
262 struct in_ifaddr **ifap1 = &ifa1->ifa_next;
264 while ((ifa = *ifap1) != NULL) {
265 if (!(ifa->ifa_flags & IFA_F_SECONDARY) &&
266 ifa1->ifa_scope <= ifa->ifa_scope)
269 if (!(ifa->ifa_flags & IFA_F_SECONDARY) ||
270 ifa1->ifa_mask != ifa->ifa_mask ||
271 !inet_ifa_match(ifa1->ifa_address, ifa)) {
272 ifap1 = &ifa->ifa_next;
278 *ifap1 = ifa->ifa_next;
280 rtmsg_ifa(RTM_DELADDR, ifa, nlh, pid);
281 blocking_notifier_call_chain(&inetaddr_chain,
293 *ifap = ifa1->ifa_next;
295 /* 3. Announce address deletion */
297 /* Send message first, then call notifier.
298 At first sight, FIB update triggered by notifier
299 will refer to already deleted ifaddr, that could confuse
300 netlink listeners. It is not true: look, gated sees
301 that route deleted and if it still thinks that ifaddr
302 is valid, it will try to restore deleted routes... Grr.
303 So that, this order is correct.
305 rtmsg_ifa(RTM_DELADDR, ifa1, nlh, pid);
306 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_DOWN, ifa1);
311 prev_prom->ifa_next = promote->ifa_next;
312 promote->ifa_next = last_prim->ifa_next;
313 last_prim->ifa_next = promote;
316 promote->ifa_flags &= ~IFA_F_SECONDARY;
317 rtmsg_ifa(RTM_NEWADDR, promote, nlh, pid);
318 blocking_notifier_call_chain(&inetaddr_chain,
320 for (ifa = promote->ifa_next; ifa; ifa = ifa->ifa_next) {
321 if (ifa1->ifa_mask != ifa->ifa_mask ||
322 !inet_ifa_match(ifa1->ifa_address, ifa))
332 static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
335 __inet_del_ifa(in_dev, ifap, destroy, NULL, 0);
338 static int __inet_insert_ifa(struct in_ifaddr *ifa, struct nlmsghdr *nlh,
341 struct in_device *in_dev = ifa->ifa_dev;
342 struct in_ifaddr *ifa1, **ifap, **last_primary;
346 if (!ifa->ifa_local) {
351 ifa->ifa_flags &= ~IFA_F_SECONDARY;
352 last_primary = &in_dev->ifa_list;
354 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
355 ifap = &ifa1->ifa_next) {
356 if (!(ifa1->ifa_flags & IFA_F_SECONDARY) &&
357 ifa->ifa_scope <= ifa1->ifa_scope)
358 last_primary = &ifa1->ifa_next;
359 if (ifa1->ifa_mask == ifa->ifa_mask &&
360 inet_ifa_match(ifa1->ifa_address, ifa)) {
361 if (ifa1->ifa_local == ifa->ifa_local) {
365 if (ifa1->ifa_scope != ifa->ifa_scope) {
369 ifa->ifa_flags |= IFA_F_SECONDARY;
373 if (!(ifa->ifa_flags & IFA_F_SECONDARY)) {
374 net_srandom(ifa->ifa_local);
378 ifa->ifa_next = *ifap;
381 /* Send message first, then call notifier.
382 Notifier will trigger FIB update, so that
383 listeners of netlink will know about new ifaddr */
384 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, pid);
385 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
/*
 * Insert an address that does not originate from a netlink request:
 * forwards to __inet_insert_ifa() with a NULL nlmsghdr and a zero third
 * argument, and returns whatever that call returns.
 */
390 static int inet_insert_ifa(struct in_ifaddr *ifa)
392 return __inet_insert_ifa(ifa, NULL, 0);
395 static int inet_set_ifa(struct net_device *dev, struct in_ifaddr *ifa)
397 struct in_device *in_dev = __in_dev_get_rtnl(dev);
405 ipv4_devconf_setall(in_dev);
406 if (ifa->ifa_dev != in_dev) {
407 BUG_TRAP(!ifa->ifa_dev);
409 ifa->ifa_dev = in_dev;
411 if (LOOPBACK(ifa->ifa_local))
412 ifa->ifa_scope = RT_SCOPE_HOST;
413 return inet_insert_ifa(ifa);
416 struct in_device *inetdev_by_index(int ifindex)
418 struct net_device *dev;
419 struct in_device *in_dev = NULL;
420 read_lock(&dev_base_lock);
421 dev = __dev_get_by_index(&init_net, ifindex);
423 in_dev = in_dev_get(dev);
424 read_unlock(&dev_base_lock);
428 /* Called only from RTNL semaphored context. No locks. */
430 struct in_ifaddr *inet_ifa_byprefix(struct in_device *in_dev, __be32 prefix,
435 for_primary_ifa(in_dev) {
436 if (ifa->ifa_mask == mask && inet_ifa_match(prefix, ifa))
438 } endfor_ifa(in_dev);
442 static int inet_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
444 struct nlattr *tb[IFA_MAX+1];
445 struct in_device *in_dev;
446 struct ifaddrmsg *ifm;
447 struct in_ifaddr *ifa, **ifap;
452 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
456 ifm = nlmsg_data(nlh);
457 in_dev = inetdev_by_index(ifm->ifa_index);
458 if (in_dev == NULL) {
463 __in_dev_put(in_dev);
465 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
466 ifap = &ifa->ifa_next) {
468 ifa->ifa_local != nla_get_be32(tb[IFA_LOCAL]))
471 if (tb[IFA_LABEL] && nla_strcmp(tb[IFA_LABEL], ifa->ifa_label))
474 if (tb[IFA_ADDRESS] &&
475 (ifm->ifa_prefixlen != ifa->ifa_prefixlen ||
476 !inet_ifa_match(nla_get_be32(tb[IFA_ADDRESS]), ifa)))
479 __inet_del_ifa(in_dev, ifap, 1, nlh, NETLINK_CB(skb).pid);
483 err = -EADDRNOTAVAIL;
488 static struct in_ifaddr *rtm_to_ifaddr(struct nlmsghdr *nlh)
490 struct nlattr *tb[IFA_MAX+1];
491 struct in_ifaddr *ifa;
492 struct ifaddrmsg *ifm;
493 struct net_device *dev;
494 struct in_device *in_dev;
497 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
501 ifm = nlmsg_data(nlh);
502 if (ifm->ifa_prefixlen > 32 || tb[IFA_LOCAL] == NULL) {
507 dev = __dev_get_by_index(&init_net, ifm->ifa_index);
513 in_dev = __in_dev_get_rtnl(dev);
514 if (in_dev == NULL) {
519 ifa = inet_alloc_ifa();
522 * A potential indev allocation can be left alive, it stays
523 * assigned to its device and is destroyed with it.
529 ipv4_devconf_setall(in_dev);
532 if (tb[IFA_ADDRESS] == NULL)
533 tb[IFA_ADDRESS] = tb[IFA_LOCAL];
535 ifa->ifa_prefixlen = ifm->ifa_prefixlen;
536 ifa->ifa_mask = inet_make_mask(ifm->ifa_prefixlen);
537 ifa->ifa_flags = ifm->ifa_flags;
538 ifa->ifa_scope = ifm->ifa_scope;
539 ifa->ifa_dev = in_dev;
541 ifa->ifa_local = nla_get_be32(tb[IFA_LOCAL]);
542 ifa->ifa_address = nla_get_be32(tb[IFA_ADDRESS]);
544 if (tb[IFA_BROADCAST])
545 ifa->ifa_broadcast = nla_get_be32(tb[IFA_BROADCAST]);
548 ifa->ifa_anycast = nla_get_be32(tb[IFA_ANYCAST]);
551 nla_strlcpy(ifa->ifa_label, tb[IFA_LABEL], IFNAMSIZ);
553 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
561 static int inet_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
563 struct in_ifaddr *ifa;
567 ifa = rtm_to_ifaddr(nlh);
571 return __inet_insert_ifa(ifa, nlh, NETLINK_CB(skb).pid);
575 * Determine a default network mask, based on the IP address.
578 static __inline__ int inet_abc_len(__be32 addr)
580 int rc = -1; /* Something else, probably a multicast. */
585 __u32 haddr = ntohl(addr);
587 if (IN_CLASSA(haddr))
589 else if (IN_CLASSB(haddr))
591 else if (IN_CLASSC(haddr))
599 int devinet_ioctl(unsigned int cmd, void __user *arg)
602 struct sockaddr_in sin_orig;
603 struct sockaddr_in *sin = (struct sockaddr_in *)&ifr.ifr_addr;
604 struct in_device *in_dev;
605 struct in_ifaddr **ifap = NULL;
606 struct in_ifaddr *ifa = NULL;
607 struct net_device *dev;
610 int tryaddrmatch = 0;
613 * Fetch the caller's info block into kernel space
616 if (copy_from_user(&ifr, arg, sizeof(struct ifreq)))
618 ifr.ifr_name[IFNAMSIZ - 1] = 0;
620 /* save original address for comparison */
621 memcpy(&sin_orig, sin, sizeof(*sin));
623 colon = strchr(ifr.ifr_name, ':');
628 dev_load(&init_net, ifr.ifr_name);
632 case SIOCGIFADDR: /* Get interface address */
633 case SIOCGIFBRDADDR: /* Get the broadcast address */
634 case SIOCGIFDSTADDR: /* Get the destination address */
635 case SIOCGIFNETMASK: /* Get the netmask for the interface */
636 /* Note that these ioctls will not sleep,
637 so that we do not impose a lock.
638 One day we will be forced to put shlock here (I mean SMP)
640 tryaddrmatch = (sin_orig.sin_family == AF_INET);
641 memset(sin, 0, sizeof(*sin));
642 sin->sin_family = AF_INET;
647 if (!capable(CAP_NET_ADMIN))
650 case SIOCSIFADDR: /* Set interface address (and family) */
651 case SIOCSIFBRDADDR: /* Set the broadcast address */
652 case SIOCSIFDSTADDR: /* Set the destination address */
653 case SIOCSIFNETMASK: /* Set the netmask for the interface */
655 if (!capable(CAP_NET_ADMIN))
658 if (sin->sin_family != AF_INET)
669 if ((dev = __dev_get_by_name(&init_net, ifr.ifr_name)) == NULL)
675 if ((in_dev = __in_dev_get_rtnl(dev)) != NULL) {
677 /* Matthias Andree */
678 /* compare label and address (4.4BSD style) */
679 /* note: we only do this for a limited set of ioctls
680 and only if the original address family was AF_INET.
681 This is checked above. */
682 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
683 ifap = &ifa->ifa_next) {
684 if (!strcmp(ifr.ifr_name, ifa->ifa_label) &&
685 sin_orig.sin_addr.s_addr ==
691 /* we didn't get a match, maybe the application is
692 4.3BSD-style and passed in junk so we fall back to
693 comparing just the label */
695 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
696 ifap = &ifa->ifa_next)
697 if (!strcmp(ifr.ifr_name, ifa->ifa_label))
702 ret = -EADDRNOTAVAIL;
703 if (!ifa && cmd != SIOCSIFADDR && cmd != SIOCSIFFLAGS)
707 case SIOCGIFADDR: /* Get interface address */
708 sin->sin_addr.s_addr = ifa->ifa_local;
711 case SIOCGIFBRDADDR: /* Get the broadcast address */
712 sin->sin_addr.s_addr = ifa->ifa_broadcast;
715 case SIOCGIFDSTADDR: /* Get the destination address */
716 sin->sin_addr.s_addr = ifa->ifa_address;
719 case SIOCGIFNETMASK: /* Get the netmask for the interface */
720 sin->sin_addr.s_addr = ifa->ifa_mask;
725 ret = -EADDRNOTAVAIL;
729 if (!(ifr.ifr_flags & IFF_UP))
730 inet_del_ifa(in_dev, ifap, 1);
733 ret = dev_change_flags(dev, ifr.ifr_flags);
736 case SIOCSIFADDR: /* Set interface address (and family) */
738 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
743 if ((ifa = inet_alloc_ifa()) == NULL)
746 memcpy(ifa->ifa_label, ifr.ifr_name, IFNAMSIZ);
748 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
751 if (ifa->ifa_local == sin->sin_addr.s_addr)
753 inet_del_ifa(in_dev, ifap, 0);
754 ifa->ifa_broadcast = 0;
755 ifa->ifa_anycast = 0;
758 ifa->ifa_address = ifa->ifa_local = sin->sin_addr.s_addr;
760 if (!(dev->flags & IFF_POINTOPOINT)) {
761 ifa->ifa_prefixlen = inet_abc_len(ifa->ifa_address);
762 ifa->ifa_mask = inet_make_mask(ifa->ifa_prefixlen);
763 if ((dev->flags & IFF_BROADCAST) &&
764 ifa->ifa_prefixlen < 31)
765 ifa->ifa_broadcast = ifa->ifa_address |
768 ifa->ifa_prefixlen = 32;
769 ifa->ifa_mask = inet_make_mask(32);
771 ret = inet_set_ifa(dev, ifa);
774 case SIOCSIFBRDADDR: /* Set the broadcast address */
776 if (ifa->ifa_broadcast != sin->sin_addr.s_addr) {
777 inet_del_ifa(in_dev, ifap, 0);
778 ifa->ifa_broadcast = sin->sin_addr.s_addr;
779 inet_insert_ifa(ifa);
783 case SIOCSIFDSTADDR: /* Set the destination address */
785 if (ifa->ifa_address == sin->sin_addr.s_addr)
788 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
791 inet_del_ifa(in_dev, ifap, 0);
792 ifa->ifa_address = sin->sin_addr.s_addr;
793 inet_insert_ifa(ifa);
796 case SIOCSIFNETMASK: /* Set the netmask for the interface */
799 * The mask we set must be legal.
802 if (bad_mask(sin->sin_addr.s_addr, 0))
805 if (ifa->ifa_mask != sin->sin_addr.s_addr) {
806 __be32 old_mask = ifa->ifa_mask;
807 inet_del_ifa(in_dev, ifap, 0);
808 ifa->ifa_mask = sin->sin_addr.s_addr;
809 ifa->ifa_prefixlen = inet_mask_len(ifa->ifa_mask);
811 /* See if current broadcast address matches
812 * with current netmask, then recalculate
813 * the broadcast address. Otherwise it's a
814 * funny address, so don't touch it since
815 * the user seems to know what (s)he's doing...
817 if ((dev->flags & IFF_BROADCAST) &&
818 (ifa->ifa_prefixlen < 31) &&
819 (ifa->ifa_broadcast ==
820 (ifa->ifa_local|~old_mask))) {
821 ifa->ifa_broadcast = (ifa->ifa_local |
822 ~sin->sin_addr.s_addr);
824 inet_insert_ifa(ifa);
834 ret = copy_to_user(arg, &ifr, sizeof(struct ifreq)) ? -EFAULT : 0;
838 static int inet_gifconf(struct net_device *dev, char __user *buf, int len)
840 struct in_device *in_dev = __in_dev_get_rtnl(dev);
841 struct in_ifaddr *ifa;
845 if (!in_dev || (ifa = in_dev->ifa_list) == NULL)
848 for (; ifa; ifa = ifa->ifa_next) {
853 if (len < (int) sizeof(ifr))
855 memset(&ifr, 0, sizeof(struct ifreq));
857 strcpy(ifr.ifr_name, ifa->ifa_label);
859 strcpy(ifr.ifr_name, dev->name);
861 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_family = AF_INET;
862 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_addr.s_addr =
865 if (copy_to_user(buf, &ifr, sizeof(struct ifreq))) {
869 buf += sizeof(struct ifreq);
870 len -= sizeof(struct ifreq);
871 done += sizeof(struct ifreq);
877 __be32 inet_select_addr(const struct net_device *dev, __be32 dst, int scope)
880 struct in_device *in_dev;
883 in_dev = __in_dev_get_rcu(dev);
887 for_primary_ifa(in_dev) {
888 if (ifa->ifa_scope > scope)
890 if (!dst || inet_ifa_match(dst, ifa)) {
891 addr = ifa->ifa_local;
895 addr = ifa->ifa_local;
896 } endfor_ifa(in_dev);
903 /* Not loopback addresses on loopback should be preferred
904 in this case. It is important that lo is the first interface
907 read_lock(&dev_base_lock);
909 for_each_netdev(&init_net, dev) {
910 if ((in_dev = __in_dev_get_rcu(dev)) == NULL)
913 for_primary_ifa(in_dev) {
914 if (ifa->ifa_scope != RT_SCOPE_LINK &&
915 ifa->ifa_scope <= scope) {
916 addr = ifa->ifa_local;
917 goto out_unlock_both;
919 } endfor_ifa(in_dev);
922 read_unlock(&dev_base_lock);
928 static __be32 confirm_addr_indev(struct in_device *in_dev, __be32 dst,
929 __be32 local, int scope)
936 (local == ifa->ifa_local || !local) &&
937 ifa->ifa_scope <= scope) {
938 addr = ifa->ifa_local;
943 same = (!local || inet_ifa_match(local, ifa)) &&
944 (!dst || inet_ifa_match(dst, ifa));
948 /* Is the selected addr in the dst subnet? */
949 if (inet_ifa_match(addr, ifa))
951 /* No, then can we use new local src? */
952 if (ifa->ifa_scope <= scope) {
953 addr = ifa->ifa_local;
956 /* search for large dst subnet for addr */
960 } endfor_ifa(in_dev);
962 return same? addr : 0;
966 * Confirm that local IP address exists using wildcards:
967 * - dev: only on this interface, 0=any interface
968 * - dst: only in the same subnet as dst, 0=any dst
969 * - local: address, 0=autoselect the local address
970 * - scope: maximum allowed scope value for the local address
972 __be32 inet_confirm_addr(const struct net_device *dev, __be32 dst, __be32 local, int scope)
975 struct in_device *in_dev;
979 if ((in_dev = __in_dev_get_rcu(dev)))
980 addr = confirm_addr_indev(in_dev, dst, local, scope);
986 read_lock(&dev_base_lock);
988 for_each_netdev(&init_net, dev) {
989 if ((in_dev = __in_dev_get_rcu(dev))) {
990 addr = confirm_addr_indev(in_dev, dst, local, scope);
996 read_unlock(&dev_base_lock);
/*
 * Add nb to inetaddr_chain, the blocking notifier chain this file calls
 * with NETDEV_UP when an address is inserted and NETDEV_DOWN when one is
 * deleted. Returns the result of blocking_notifier_chain_register().
 */
1005 int register_inetaddr_notifier(struct notifier_block *nb)
1007 return blocking_notifier_chain_register(&inetaddr_chain, nb);
/*
 * Remove nb from inetaddr_chain, the blocking notifier chain used by this
 * file for address up/down events. Returns the result of
 * blocking_notifier_chain_unregister().
 */
1010 int unregister_inetaddr_notifier(struct notifier_block *nb)
1012 return blocking_notifier_chain_unregister(&inetaddr_chain, nb);
1015 /* Rename ifa_labels for a device name change. Make some effort to preserve existing
1016 * alias numbering and to create unique labels if possible.
1018 static void inetdev_changename(struct net_device *dev, struct in_device *in_dev)
1020 struct in_ifaddr *ifa;
1023 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
1024 char old[IFNAMSIZ], *dot;
1026 memcpy(old, ifa->ifa_label, IFNAMSIZ);
1027 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
1030 dot = strchr(old, ':');
1032 sprintf(old, ":%d", named);
1035 if (strlen(dot) + strlen(dev->name) < IFNAMSIZ) {
1036 strcat(ifa->ifa_label, dot);
1038 strcpy(ifa->ifa_label + (IFNAMSIZ - strlen(dot) - 1), dot);
1043 /* Called only under RTNL semaphore */
1045 static int inetdev_event(struct notifier_block *this, unsigned long event,
1048 struct net_device *dev = ptr;
1049 struct in_device *in_dev = __in_dev_get_rtnl(dev);
1051 if (dev->nd_net != &init_net)
1057 if (event == NETDEV_REGISTER) {
1058 in_dev = inetdev_init(dev);
1060 return notifier_from_errno(-ENOMEM);
1061 if (dev->flags & IFF_LOOPBACK) {
1062 IN_DEV_CONF_SET(in_dev, NOXFRM, 1);
1063 IN_DEV_CONF_SET(in_dev, NOPOLICY, 1);
1070 case NETDEV_REGISTER:
1071 printk(KERN_DEBUG "inetdev_event: bug\n");
1077 if (dev->flags & IFF_LOOPBACK) {
1078 struct in_ifaddr *ifa;
1079 if ((ifa = inet_alloc_ifa()) != NULL) {
1081 ifa->ifa_address = htonl(INADDR_LOOPBACK);
1082 ifa->ifa_prefixlen = 8;
1083 ifa->ifa_mask = inet_make_mask(8);
1084 in_dev_hold(in_dev);
1085 ifa->ifa_dev = in_dev;
1086 ifa->ifa_scope = RT_SCOPE_HOST;
1087 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
1088 inet_insert_ifa(ifa);
1096 case NETDEV_CHANGEMTU:
1099 /* MTU fell below 68, disable IP */
1100 case NETDEV_UNREGISTER:
1101 inetdev_destroy(in_dev);
1103 case NETDEV_CHANGENAME:
1104 /* Do not notify about label change, this event is
1105 * not interesting to applications using netlink.
1107 inetdev_changename(dev, in_dev);
1109 #ifdef CONFIG_SYSCTL
1110 devinet_sysctl_unregister(&in_dev->cnf);
1111 neigh_sysctl_unregister(in_dev->arp_parms);
1112 neigh_sysctl_register(dev, in_dev->arp_parms, NET_IPV4,
1113 NET_IPV4_NEIGH, "ipv4", NULL, NULL);
1114 devinet_sysctl_register(in_dev, &in_dev->cnf);
/*
 * Notifier block whose callback is inetdev_event(); devinet_init() passes
 * it to register_netdevice_notifier().
 */
1122 static struct notifier_block ip_netdev_notifier = {
1123 .notifier_call =inetdev_event,
/*
 * Buffer size rtmsg_ifa() asks nlmsg_new() for when building one address
 * notification: the aligned ifaddrmsg header plus space for each attribute
 * that inet_fill_ifaddr() may emit (four 4-byte values and a label of up
 * to IFNAMSIZ bytes).
 */
1126 static inline size_t inet_nlmsg_size(void)
1128 return NLMSG_ALIGN(sizeof(struct ifaddrmsg))
1129 + nla_total_size(4) /* IFA_ADDRESS */
1130 + nla_total_size(4) /* IFA_LOCAL */
1131 + nla_total_size(4) /* IFA_BROADCAST */
1132 + nla_total_size(4) /* IFA_ANYCAST */
1133 + nla_total_size(IFNAMSIZ); /* IFA_LABEL */
1136 static int inet_fill_ifaddr(struct sk_buff *skb, struct in_ifaddr *ifa,
1137 u32 pid, u32 seq, int event, unsigned int flags)
1139 struct ifaddrmsg *ifm;
1140 struct nlmsghdr *nlh;
1142 nlh = nlmsg_put(skb, pid, seq, event, sizeof(*ifm), flags);
1146 ifm = nlmsg_data(nlh);
1147 ifm->ifa_family = AF_INET;
1148 ifm->ifa_prefixlen = ifa->ifa_prefixlen;
1149 ifm->ifa_flags = ifa->ifa_flags|IFA_F_PERMANENT;
1150 ifm->ifa_scope = ifa->ifa_scope;
1151 ifm->ifa_index = ifa->ifa_dev->dev->ifindex;
1153 if (ifa->ifa_address)
1154 NLA_PUT_BE32(skb, IFA_ADDRESS, ifa->ifa_address);
1157 NLA_PUT_BE32(skb, IFA_LOCAL, ifa->ifa_local);
1159 if (ifa->ifa_broadcast)
1160 NLA_PUT_BE32(skb, IFA_BROADCAST, ifa->ifa_broadcast);
1162 if (ifa->ifa_anycast)
1163 NLA_PUT_BE32(skb, IFA_ANYCAST, ifa->ifa_anycast);
1165 if (ifa->ifa_label[0])
1166 NLA_PUT_STRING(skb, IFA_LABEL, ifa->ifa_label);
1168 return nlmsg_end(skb, nlh);
1171 nlmsg_cancel(skb, nlh);
1175 static int inet_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb)
1178 struct net_device *dev;
1179 struct in_device *in_dev;
1180 struct in_ifaddr *ifa;
1181 int s_ip_idx, s_idx = cb->args[0];
1183 s_ip_idx = ip_idx = cb->args[1];
1185 for_each_netdev(&init_net, dev) {
1190 if ((in_dev = __in_dev_get_rtnl(dev)) == NULL)
1193 for (ifa = in_dev->ifa_list, ip_idx = 0; ifa;
1194 ifa = ifa->ifa_next, ip_idx++) {
1195 if (ip_idx < s_ip_idx)
1197 if (inet_fill_ifaddr(skb, ifa, NETLINK_CB(cb->skb).pid,
1199 RTM_NEWADDR, NLM_F_MULTI) <= 0)
1208 cb->args[1] = ip_idx;
1213 static void rtmsg_ifa(int event, struct in_ifaddr* ifa, struct nlmsghdr *nlh,
1216 struct sk_buff *skb;
1217 u32 seq = nlh ? nlh->nlmsg_seq : 0;
1220 skb = nlmsg_new(inet_nlmsg_size(), GFP_KERNEL);
1224 err = inet_fill_ifaddr(skb, ifa, pid, seq, event, 0);
1226 /* -EMSGSIZE implies BUG in inet_nlmsg_size() */
1227 WARN_ON(err == -EMSGSIZE);
1231 err = rtnl_notify(skb, pid, RTNLGRP_IPV4_IFADDR, nlh, GFP_KERNEL);
1234 rtnl_set_sk_err(RTNLGRP_IPV4_IFADDR, err);
1237 #ifdef CONFIG_SYSCTL
1239 static void devinet_copy_dflt_conf(int i)
1241 struct net_device *dev;
1243 read_lock(&dev_base_lock);
1244 for_each_netdev(&init_net, dev) {
1245 struct in_device *in_dev;
1247 in_dev = __in_dev_get_rcu(dev);
1248 if (in_dev && !test_bit(i, in_dev->cnf.state))
1249 in_dev->cnf.data[i] = ipv4_devconf_dflt.data[i];
1252 read_unlock(&dev_base_lock);
1255 static int devinet_conf_proc(ctl_table *ctl, int write,
1256 struct file* filp, void __user *buffer,
1257 size_t *lenp, loff_t *ppos)
1259 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
1262 struct ipv4_devconf *cnf = ctl->extra1;
1263 int i = (int *)ctl->data - cnf->data;
1265 set_bit(i, cnf->state);
1267 if (cnf == &ipv4_devconf_dflt)
1268 devinet_copy_dflt_conf(i);
1274 static int devinet_conf_sysctl(ctl_table *table, int __user *name, int nlen,
1275 void __user *oldval, size_t __user *oldlenp,
1276 void __user *newval, size_t newlen)
1278 struct ipv4_devconf *cnf;
1279 int *valp = table->data;
1283 if (!newval || !newlen)
1286 if (newlen != sizeof(int))
1289 if (get_user(new, (int __user *)newval))
1295 if (oldval && oldlenp) {
1298 if (get_user(len, oldlenp))
1302 if (len > table->maxlen)
1303 len = table->maxlen;
1304 if (copy_to_user(oldval, valp, len))
1306 if (put_user(len, oldlenp))
1313 cnf = table->extra1;
1314 i = (int *)table->data - cnf->data;
1316 set_bit(i, cnf->state);
1318 if (cnf == &ipv4_devconf_dflt)
1319 devinet_copy_dflt_conf(i);
1324 void inet_forward_change(void)
1326 struct net_device *dev;
1327 int on = IPV4_DEVCONF_ALL(FORWARDING);
1329 IPV4_DEVCONF_ALL(ACCEPT_REDIRECTS) = !on;
1330 IPV4_DEVCONF_DFLT(FORWARDING) = on;
1332 read_lock(&dev_base_lock);
1333 for_each_netdev(&init_net, dev) {
1334 struct in_device *in_dev;
1336 in_dev = __in_dev_get_rcu(dev);
1338 IN_DEV_CONF_SET(in_dev, FORWARDING, on);
1341 read_unlock(&dev_base_lock);
1346 static int devinet_sysctl_forward(ctl_table *ctl, int write,
1347 struct file* filp, void __user *buffer,
1348 size_t *lenp, loff_t *ppos)
1350 int *valp = ctl->data;
1352 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
1354 if (write && *valp != val) {
1355 if (valp == &IPV4_DEVCONF_ALL(FORWARDING))
1356 inet_forward_change();
1357 else if (valp != &IPV4_DEVCONF_DFLT(FORWARDING))
1364 int ipv4_doint_and_flush(ctl_table *ctl, int write,
1365 struct file* filp, void __user *buffer,
1366 size_t *lenp, loff_t *ppos)
1368 int *valp = ctl->data;
1370 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
1372 if (write && *valp != val)
1378 int ipv4_doint_and_flush_strategy(ctl_table *table, int __user *name, int nlen,
1379 void __user *oldval, size_t __user *oldlenp,
1380 void __user *newval, size_t newlen)
1382 int ret = devinet_conf_sysctl(table, name, nlen, oldval, oldlenp,
1392 #define DEVINET_SYSCTL_ENTRY(attr, name, mval, proc, sysctl) \
1394 .ctl_name = NET_IPV4_CONF_ ## attr, \
1396 .data = ipv4_devconf.data + \
1397 NET_IPV4_CONF_ ## attr - 1, \
1398 .maxlen = sizeof(int), \
1400 .proc_handler = proc, \
1401 .strategy = sysctl, \
1402 .extra1 = &ipv4_devconf, \
/*
 * DEVINET_SYSCTL_ENTRY() with 0644 as its third (mval) argument and the
 * generic devinet_conf_proc / devinet_conf_sysctl pair as proc handler and
 * strategy. NOTE(review): 0644 is presumably the entry's file mode; the
 * line that consumes mval is not visible here -- confirm.
 */
1405 #define DEVINET_SYSCTL_RW_ENTRY(attr, name) \
1406 DEVINET_SYSCTL_ENTRY(attr, name, 0644, devinet_conf_proc, \
1407 devinet_conf_sysctl)
/*
 * DEVINET_SYSCTL_ENTRY() with 0444 as its third (mval) argument and the
 * generic devinet_conf_proc / devinet_conf_sysctl pair as proc handler and
 * strategy. NOTE(review): 0444 is presumably the entry's file mode; the
 * line that consumes mval is not visible here -- confirm.
 */
1409 #define DEVINET_SYSCTL_RO_ENTRY(attr, name) \
1410 DEVINET_SYSCTL_ENTRY(attr, name, 0444, devinet_conf_proc, \
1411 devinet_conf_sysctl)
/*
 * DEVINET_SYSCTL_ENTRY() with 0644 as its third (mval) argument and a
 * caller-supplied proc handler and strategy, for entries that need more
 * than the generic devinet_conf_* handlers.
 */
1413 #define DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, proc, sysctl) \
1414 DEVINET_SYSCTL_ENTRY(attr, name, 0644, proc, sysctl)
/*
 * DEVINET_SYSCTL_COMPLEX_ENTRY() wired to ipv4_doint_and_flush as the proc
 * handler and ipv4_doint_and_flush_strategy as the strategy.
 */
1416 #define DEVINET_SYSCTL_FLUSHING_ENTRY(attr, name) \
1417 DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, ipv4_doint_and_flush, \
1418 ipv4_doint_and_flush_strategy)
1420 static struct devinet_sysctl_table {
1421 struct ctl_table_header *sysctl_header;
1422 ctl_table devinet_vars[__NET_IPV4_CONF_MAX];
1423 ctl_table devinet_dev[2];
1424 ctl_table devinet_conf_dir[2];
1425 ctl_table devinet_proto_dir[2];
1426 ctl_table devinet_root_dir[2];
1427 } devinet_sysctl = {
1429 DEVINET_SYSCTL_COMPLEX_ENTRY(FORWARDING, "forwarding",
1430 devinet_sysctl_forward,
1431 devinet_conf_sysctl),
1432 DEVINET_SYSCTL_RO_ENTRY(MC_FORWARDING, "mc_forwarding"),
1434 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_REDIRECTS, "accept_redirects"),
1435 DEVINET_SYSCTL_RW_ENTRY(SECURE_REDIRECTS, "secure_redirects"),
1436 DEVINET_SYSCTL_RW_ENTRY(SHARED_MEDIA, "shared_media"),
1437 DEVINET_SYSCTL_RW_ENTRY(RP_FILTER, "rp_filter"),
1438 DEVINET_SYSCTL_RW_ENTRY(SEND_REDIRECTS, "send_redirects"),
1439 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_SOURCE_ROUTE,
1440 "accept_source_route"),
1441 DEVINET_SYSCTL_RW_ENTRY(PROXY_ARP, "proxy_arp"),
1442 DEVINET_SYSCTL_RW_ENTRY(MEDIUM_ID, "medium_id"),
1443 DEVINET_SYSCTL_RW_ENTRY(BOOTP_RELAY, "bootp_relay"),
1444 DEVINET_SYSCTL_RW_ENTRY(LOG_MARTIANS, "log_martians"),
1445 DEVINET_SYSCTL_RW_ENTRY(TAG, "tag"),
1446 DEVINET_SYSCTL_RW_ENTRY(ARPFILTER, "arp_filter"),
1447 DEVINET_SYSCTL_RW_ENTRY(ARP_ANNOUNCE, "arp_announce"),
1448 DEVINET_SYSCTL_RW_ENTRY(ARP_IGNORE, "arp_ignore"),
1449 DEVINET_SYSCTL_RW_ENTRY(ARP_ACCEPT, "arp_accept"),
1451 DEVINET_SYSCTL_FLUSHING_ENTRY(NOXFRM, "disable_xfrm"),
1452 DEVINET_SYSCTL_FLUSHING_ENTRY(NOPOLICY, "disable_policy"),
1453 DEVINET_SYSCTL_FLUSHING_ENTRY(FORCE_IGMP_VERSION,
1454 "force_igmp_version"),
1455 DEVINET_SYSCTL_FLUSHING_ENTRY(PROMOTE_SECONDARIES,
1456 "promote_secondaries"),
1460 .ctl_name = NET_PROTO_CONF_ALL,
1463 .child = devinet_sysctl.devinet_vars,
1466 .devinet_conf_dir = {
1468 .ctl_name = NET_IPV4_CONF,
1471 .child = devinet_sysctl.devinet_dev,
1474 .devinet_proto_dir = {
1476 .ctl_name = NET_IPV4,
1479 .child = devinet_sysctl.devinet_conf_dir,
1482 .devinet_root_dir = {
1484 .ctl_name = CTL_NET,
1487 .child = devinet_sysctl.devinet_proto_dir,
1492 static void devinet_sysctl_register(struct in_device *in_dev,
1493 struct ipv4_devconf *p)
1496 struct net_device *dev = in_dev ? in_dev->dev : NULL;
1497 struct devinet_sysctl_table *t = kmemdup(&devinet_sysctl, sizeof(*t),
1499 char *dev_name = NULL;
1503 for (i = 0; i < ARRAY_SIZE(t->devinet_vars) - 1; i++) {
1504 t->devinet_vars[i].data += (char *)p - (char *)&ipv4_devconf;
1505 t->devinet_vars[i].extra1 = p;
1509 dev_name = dev->name;
1510 t->devinet_dev[0].ctl_name = dev->ifindex;
1512 dev_name = "default";
1513 t->devinet_dev[0].ctl_name = NET_PROTO_CONF_DEFAULT;
1517 * Make a copy of dev_name, because '.procname' is regarded as const
1518 * by sysctl and we wouldn't want anyone to change it under our feet
1519 * (see SIOCSIFNAME).
1521 dev_name = kstrdup(dev_name, GFP_KERNEL);
1525 t->devinet_dev[0].procname = dev_name;
1526 t->devinet_dev[0].child = t->devinet_vars;
1527 t->devinet_conf_dir[0].child = t->devinet_dev;
1528 t->devinet_proto_dir[0].child = t->devinet_conf_dir;
1529 t->devinet_root_dir[0].child = t->devinet_proto_dir;
1531 t->sysctl_header = register_sysctl_table(t->devinet_root_dir);
1532 if (!t->sysctl_header)
1546 static void devinet_sysctl_unregister(struct ipv4_devconf *p)
1549 struct devinet_sysctl_table *t = p->sysctl;
1551 unregister_sysctl_table(t->sysctl_header);
1552 kfree(t->devinet_dev[0].procname);
/*
 * Initialisation entry point for this file (marked __init). It hooks the
 * IPv4 address code into the rest of the stack:
 *  - inet_gifconf is registered as the gifconf handler for PF_INET;
 *  - ip_netdev_notifier (callback inetdev_event) is registered for
 *    netdevice events;
 *  - rtnetlink handlers are registered for RTM_NEWADDR, RTM_DELADDR and
 *    RTM_GETADDR;
 *  - under CONFIG_SYSCTL, the devinet_sysctl template table is registered
 *    and a second table is created for ipv4_devconf_dflt.
 */
1558 void __init devinet_init(void)
1560 register_gifconf(PF_INET, inet_gifconf);
1561 register_netdevice_notifier(&ip_netdev_notifier);
/* NEWADDR/DELADDR supply the third argument only; GETADDR supplies only the fourth (inet_dump_ifaddr). */
1563 rtnl_register(PF_INET, RTM_NEWADDR, inet_rtm_newaddr, NULL);
1564 rtnl_register(PF_INET, RTM_DELADDR, inet_rtm_deladdr, NULL);
1565 rtnl_register(PF_INET, RTM_GETADDR, NULL, inet_dump_ifaddr);
1566 #ifdef CONFIG_SYSCTL
/* The static template is registered as-is; its .data pointers reference ipv4_devconf. */
1567 devinet_sysctl.sysctl_header =
1568 register_sysctl_table(devinet_sysctl.devinet_root_dir);
/* A NULL in_dev means no device: a table for the default configuration. */
1569 devinet_sysctl_register(NULL, &ipv4_devconf_dflt);
1573 EXPORT_SYMBOL(in_dev_finish_destroy);
1574 EXPORT_SYMBOL(inet_select_addr);
1575 EXPORT_SYMBOL(inetdev_by_index);
1576 EXPORT_SYMBOL(register_inetaddr_notifier);
1577 EXPORT_SYMBOL(unregister_inetaddr_notifier);