in.c revision 189931
1139823Simp/*-
21541Srgrimes * Copyright (c) 1982, 1986, 1991, 1993
31541Srgrimes *	The Regents of the University of California.  All rights reserved.
4137668Smlaier * Copyright (C) 2001 WIDE Project.  All rights reserved.
51541Srgrimes *
61541Srgrimes * Redistribution and use in source and binary forms, with or without
71541Srgrimes * modification, are permitted provided that the following conditions
81541Srgrimes * are met:
91541Srgrimes * 1. Redistributions of source code must retain the above copyright
101541Srgrimes *    notice, this list of conditions and the following disclaimer.
111541Srgrimes * 2. Redistributions in binary form must reproduce the above copyright
121541Srgrimes *    notice, this list of conditions and the following disclaimer in the
131541Srgrimes *    documentation and/or other materials provided with the distribution.
141541Srgrimes * 4. Neither the name of the University nor the names of its contributors
151541Srgrimes *    may be used to endorse or promote products derived from this software
161541Srgrimes *    without specific prior written permission.
171541Srgrimes *
181541Srgrimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
191541Srgrimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
201541Srgrimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
211541Srgrimes * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
221541Srgrimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
231541Srgrimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
241541Srgrimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
251541Srgrimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
261541Srgrimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
271541Srgrimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
281541Srgrimes * SUCH DAMAGE.
291541Srgrimes *
3010939Swollman *	@(#)in.c	8.4 (Berkeley) 1/9/95
311541Srgrimes */
321541Srgrimes
33172467Ssilby#include <sys/cdefs.h>
34172467Ssilby__FBSDID("$FreeBSD: head/sys/netinet/in.c 189931 2009-03-17 14:41:54Z bms $");
35172467Ssilby
36143868Sglebius#include "opt_carp.h"
37143868Sglebius
381541Srgrimes#include <sys/param.h>
391549Srgrimes#include <sys/systm.h>
4024204Sbde#include <sys/sockio.h>
411541Srgrimes#include <sys/malloc.h>
42164033Srwatson#include <sys/priv.h>
431541Srgrimes#include <sys/socket.h>
44186948Sbz#include <sys/jail.h>
4512704Sphk#include <sys/kernel.h>
46186948Sbz#include <sys/proc.h>
4712704Sphk#include <sys/sysctl.h>
48181803Sbz#include <sys/vimage.h>
491541Srgrimes
501541Srgrimes#include <net/if.h>
51186119Sqingli#include <net/if_llatbl.h>
5255009Sshin#include <net/if_types.h>
531541Srgrimes#include <net/route.h>
541541Srgrimes
551541Srgrimes#include <netinet/in.h>
561541Srgrimes#include <netinet/in_var.h>
5781127Sume#include <netinet/in_pcb.h>
58170613Sbms#include <netinet/ip_var.h>
59185571Sbz#include <netinet/vinet.h>
60189592Sbms#include <netinet/igmp_var.h>
611541Srgrimes
/* Conversions between an IPv4 netmask and its prefix length. */
static int in_mask2len(struct in_addr *);
static void in_len2mask(struct in_addr *, int);
/* Back end for the SIOC[GAD]LIFADDR ioctls dispatched by in_control(). */
static int in_lifaddr_ioctl(struct socket *, u_long, caddr_t,
	struct ifnet *, struct thread *);

/* Prefix route helpers used by in_ifinit() and in_ifscrub(). */
static int	in_addprefix(struct in_ifaddr *, int);
static int	in_scrubprefix(struct in_ifaddr *);
/* Trims the length field of a netmask sockaddr. */
static void	in_socktrim(struct sockaddr_in *);
/* Installs an address on an interface and sets up its route. */
static int	in_ifinit(struct ifnet *,
	    struct in_ifaddr *, struct sockaddr_in *, int);
static void	in_purgemaddrs(struct ifnet *);
731541Srgrimes
/*
 * Storage for the tunables exported below.  These file-scope definitions
 * are only compiled when VIMAGE_GLOBALS is defined.
 */
#ifdef VIMAGE_GLOBALS
static int subnetsarelocal;
static int sameprefixcarponly;
extern struct inpcbinfo ripcbinfo;
#endif

/*
 * Read/write integer sysctls under _net_inet_ip (subnets_are_local and
 * same_prefix_carp_only), both with an initial value of 0.
 * subnets_are_local is consulted by in_localaddr().
 */
SYSCTL_V_INT(V_NET, vnet_inet, _net_inet_ip, OID_AUTO, subnets_are_local,
	CTLFLAG_RW, subnetsarelocal, 0,
	"Treat all subnets as directly connected");
SYSCTL_V_INT(V_NET, vnet_inet, _net_inet_ip, OID_AUTO, same_prefix_carp_only,
	CTLFLAG_RW, sameprefixcarponly, 0,
	"Refuse to create same prefixes on different interfaces");
8621666Swollman
871541Srgrimes/*
881541Srgrimes * Return 1 if an internet address is for a ``local'' host
891541Srgrimes * (one to which we have a connection).  If subnetsarelocal
901541Srgrimes * is true, this includes other subnets of the local net.
911541Srgrimes * Otherwise, it includes only the directly-connected (sub)nets.
921541Srgrimes */
931549Srgrimesint
94169454Srwatsonin_localaddr(struct in_addr in)
951541Srgrimes{
96183550Szec	INIT_VNET_INET(curvnet);
971541Srgrimes	register u_long i = ntohl(in.s_addr);
981541Srgrimes	register struct in_ifaddr *ia;
991541Srgrimes
100181803Sbz	if (V_subnetsarelocal) {
101181803Sbz		TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link)
1021541Srgrimes			if ((i & ia->ia_netmask) == ia->ia_net)
1031541Srgrimes				return (1);
1041541Srgrimes	} else {
105181803Sbz		TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link)
1061541Srgrimes			if ((i & ia->ia_subnetmask) == ia->ia_subnet)
1071541Srgrimes				return (1);
1081541Srgrimes	}
1091541Srgrimes	return (0);
1101541Srgrimes}
1111541Srgrimes
1121541Srgrimes/*
113133486Sandre * Return 1 if an internet address is for the local host and configured
114133486Sandre * on one of its interfaces.
115133486Sandre */
116133486Sandreint
117169454Srwatsonin_localip(struct in_addr in)
118133486Sandre{
119183550Szec	INIT_VNET_INET(curvnet);
120133486Sandre	struct in_ifaddr *ia;
121133486Sandre
122133486Sandre	LIST_FOREACH(ia, INADDR_HASH(in.s_addr), ia_hash) {
123133486Sandre		if (IA_SIN(ia)->sin_addr.s_addr == in.s_addr)
124184295Sbz			return (1);
125133486Sandre	}
126184295Sbz	return (0);
127133486Sandre}
128133486Sandre
129133486Sandre/*
1301541Srgrimes * Determine whether an IP address is in a reserved set of addresses
1311541Srgrimes * that may not be forwarded, or whether datagrams to that destination
1321541Srgrimes * may be forwarded.
1331541Srgrimes */
1341549Srgrimesint
135169454Srwatsonin_canforward(struct in_addr in)
1361541Srgrimes{
1371541Srgrimes	register u_long i = ntohl(in.s_addr);
1381541Srgrimes	register u_long net;
1391541Srgrimes
140166450Sbms	if (IN_EXPERIMENTAL(i) || IN_MULTICAST(i) || IN_LINKLOCAL(i))
1411541Srgrimes		return (0);
1421541Srgrimes	if (IN_CLASSA(i)) {
1431541Srgrimes		net = i & IN_CLASSA_NET;
1441541Srgrimes		if (net == 0 || net == (IN_LOOPBACKNET << IN_CLASSA_NSHIFT))
1451541Srgrimes			return (0);
1461541Srgrimes	}
1471541Srgrimes	return (1);
1481541Srgrimes}
1491541Srgrimes
1501541Srgrimes/*
1511541Srgrimes * Trim a mask in a sockaddr
1521541Srgrimes */
15312296Sphkstatic void
154169454Srwatsonin_socktrim(struct sockaddr_in *ap)
1551541Srgrimes{
1561541Srgrimes    register char *cplim = (char *) &ap->sin_addr;
1571541Srgrimes    register char *cp = (char *) (&ap->sin_addr + 1);
1581541Srgrimes
1591541Srgrimes    ap->sin_len = 0;
1604127Swollman    while (--cp >= cplim)
161133874Srwatson	if (*cp) {
1621541Srgrimes	    (ap)->sin_len = cp - (char *) (ap) + 1;
1631541Srgrimes	    break;
1641541Srgrimes	}
1651541Srgrimes}
1661541Srgrimes
/*
 * Convert an IPv4 netmask to a prefix length.
 *
 * Counts the leading one bits of *mask, reading its bytes in memory
 * order: whole 0xff bytes first, then the leading one bits of the first
 * byte that is not 0xff.  Bits after the first zero bit are ignored, so a
 * non-contiguous mask yields the length of its leading run only.
 *
 * Returns a value between 0 and 8 * sizeof(struct in_addr) inclusive.
 */
static int
in_mask2len(struct in_addr *mask)
{
	const unsigned char *p = (const unsigned char *)mask;
	const int nbytes = (int)sizeof(*mask);
	int x, y;

	/* Skip over the bytes that are entirely set. */
	for (x = 0; x < nbytes; x++) {
		if (p[x] != 0xff)
			break;
	}

	/* Count the leading one bits of the first partial byte, if any. */
	y = 0;
	if (x < nbytes) {
		for (y = 0; y < 8; y++) {
			if ((p[x] & (0x80 >> y)) == 0)
				break;
		}
	}
	return (x * 8 + y);
}
18855009Sshin
/*
 * Build an IPv4 netmask from a prefix length.
 *
 * *mask is cleared and then its first `len' bits, in memory order, are
 * set.  `len' is clamped to the range 0..8 * sizeof(struct in_addr) so
 * that an out-of-range value can neither write past the end of *mask nor
 * produce a negative shift count.
 */
static void
in_len2mask(struct in_addr *mask, int len)
{
	unsigned char *p = (unsigned char *)mask;
	const int maxbits = (int)(sizeof(*mask) * 8);
	int i;

	if (len < 0)
		len = 0;
	else if (len > maxbits)
		len = maxbits;

	bzero(mask, sizeof(*mask));
	/* Whole bytes first ... */
	for (i = 0; i < len / 8; i++)
		p[i] = 0xff;
	/* ... then the leading bits of the following byte. */
	if (len % 8)
		p[i] = (0xff00 >> (len % 8)) & 0xff;
}
20255009Sshin
2031541Srgrimes/*
2041541Srgrimes * Generic internet control operations (ioctl's).
2051541Srgrimes * Ifp is 0 if not an interface-specific ioctl.
2061541Srgrimes */
2071541Srgrimes/* ARGSUSED */
2081549Srgrimesint
209169454Srwatsonin_control(struct socket *so, u_long cmd, caddr_t data, struct ifnet *ifp,
210169454Srwatson    struct thread *td)
2111541Srgrimes{
212183550Szec	INIT_VNET_INET(curvnet); /* both so and ifp can be NULL here! */
2131541Srgrimes	register struct ifreq *ifr = (struct ifreq *)data;
214184295Sbz	register struct in_ifaddr *ia, *iap;
2151541Srgrimes	register struct ifaddr *ifa;
216168032Sbms	struct in_addr allhosts_addr;
21784102Sjlemon	struct in_addr dst;
2181541Srgrimes	struct in_ifaddr *oia;
219189592Sbms	struct in_ifinfo *ii;
2201541Srgrimes	struct in_aliasreq *ifra = (struct in_aliasreq *)data;
2211541Srgrimes	struct sockaddr_in oldaddr;
22287124Sbrian	int error, hostIsNew, iaIsNew, maskIsNew, s;
223168032Sbms	int iaIsFirst;
2241541Srgrimes
225184295Sbz	ia = NULL;
226168032Sbms	iaIsFirst = 0;
22787124Sbrian	iaIsNew = 0;
228168032Sbms	allhosts_addr.s_addr = htonl(INADDR_ALLHOSTS_GROUP);
22987124Sbrian
23055009Sshin	switch (cmd) {
23155009Sshin	case SIOCALIFADDR:
232164033Srwatson		if (td != NULL) {
233164033Srwatson			error = priv_check(td, PRIV_NET_ADDIFADDR);
234164033Srwatson			if (error)
235164033Srwatson				return (error);
236164033Srwatson		}
237184295Sbz		if (ifp == NULL)
238184295Sbz			return (EINVAL);
239164033Srwatson		return in_lifaddr_ioctl(so, cmd, data, ifp, td);
240164033Srwatson
24155009Sshin	case SIOCDLIFADDR:
242164033Srwatson		if (td != NULL) {
243164033Srwatson			error = priv_check(td, PRIV_NET_DELIFADDR);
244164033Srwatson			if (error)
245164033Srwatson				return (error);
246164033Srwatson		}
247184295Sbz		if (ifp == NULL)
248184295Sbz			return (EINVAL);
249164033Srwatson		return in_lifaddr_ioctl(so, cmd, data, ifp, td);
250164033Srwatson
25155009Sshin	case SIOCGLIFADDR:
252184295Sbz		if (ifp == NULL)
253184295Sbz			return (EINVAL);
25483366Sjulian		return in_lifaddr_ioctl(so, cmd, data, ifp, td);
25555009Sshin	}
25655009Sshin
2571541Srgrimes	/*
2581541Srgrimes	 * Find address for this interface, if it exists.
25914632Sfenner	 *
26014632Sfenner	 * If an alias address was specified, find that one instead of
26184102Sjlemon	 * the first one on the interface, if possible.
2621541Srgrimes	 */
263184295Sbz	if (ifp != NULL) {
26484102Sjlemon		dst = ((struct sockaddr_in *)&ifr->ifr_addr)->sin_addr;
26584102Sjlemon		LIST_FOREACH(iap, INADDR_HASH(dst.s_addr), ia_hash)
26684102Sjlemon			if (iap->ia_ifp == ifp &&
26784102Sjlemon			    iap->ia_addr.sin_addr.s_addr == dst.s_addr) {
268186948Sbz				if (td == NULL || prison_check_ip4(
269188144Sjamie				    td->td_ucred, &dst) == 0)
270186948Sbz					ia = iap;
27184102Sjlemon				break;
27284102Sjlemon			}
27384102Sjlemon		if (ia == NULL)
27484102Sjlemon			TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
27584102Sjlemon				iap = ifatoia(ifa);
27684102Sjlemon				if (iap->ia_addr.sin_family == AF_INET) {
277186948Sbz					if (td != NULL &&
278188144Sjamie					    prison_check_ip4(td->td_ucred,
279188144Sjamie					    &iap->ia_addr.sin_addr) != 0)
280186948Sbz						continue;
28114632Sfenner					ia = iap;
28214632Sfenner					break;
28314632Sfenner				}
28414632Sfenner			}
285168032Sbms		if (ia == NULL)
286168032Sbms			iaIsFirst = 1;
28784102Sjlemon	}
2881541Srgrimes
2891541Srgrimes	switch (cmd) {
2901541Srgrimes
2911541Srgrimes	case SIOCAIFADDR:
2921541Srgrimes	case SIOCDIFADDR:
293184295Sbz		if (ifp == NULL)
29441575Seivind			return (EADDRNOTAVAIL);
2958071Swollman		if (ifra->ifra_addr.sin_family == AF_INET) {
29671999Sphk			for (oia = ia; ia; ia = TAILQ_NEXT(ia, ia_link)) {
2978071Swollman				if (ia->ia_ifp == ifp  &&
2988071Swollman				    ia->ia_addr.sin_addr.s_addr ==
2998071Swollman				    ifra->ifra_addr.sin_addr.s_addr)
3008071Swollman					break;
3018071Swollman			}
3028876Srgrimes			if ((ifp->if_flags & IFF_POINTOPOINT)
3038071Swollman			    && (cmd == SIOCAIFADDR)
3048071Swollman			    && (ifra->ifra_dstaddr.sin_addr.s_addr
3058071Swollman				== INADDR_ANY)) {
306184295Sbz				return (EDESTADDRREQ);
3078071Swollman			}
3081541Srgrimes		}
309184295Sbz		if (cmd == SIOCDIFADDR && ia == NULL)
3101541Srgrimes			return (EADDRNOTAVAIL);
3111541Srgrimes		/* FALLTHROUGH */
3121541Srgrimes	case SIOCSIFADDR:
3131541Srgrimes	case SIOCSIFNETMASK:
3141541Srgrimes	case SIOCSIFDSTADDR:
315164033Srwatson		if (td != NULL) {
316175626Sbz			error = priv_check(td, (cmd == SIOCDIFADDR) ?
317175626Sbz			    PRIV_NET_DELIFADDR : PRIV_NET_ADDIFADDR);
318164033Srwatson			if (error)
319164033Srwatson				return (error);
320164033Srwatson		}
3211541Srgrimes
322184295Sbz		if (ifp == NULL)
32341575Seivind			return (EADDRNOTAVAIL);
324184295Sbz		if (ia == NULL) {
32520407Swollman			ia = (struct in_ifaddr *)
326111119Simp				malloc(sizeof *ia, M_IFADDR, M_WAITOK | M_ZERO);
327184295Sbz			if (ia == NULL)
3281541Srgrimes				return (ENOBUFS);
32915092Sdg			/*
33015092Sdg			 * Protect from ipintr() traversing address list
33115092Sdg			 * while we're modifying it.
33215092Sdg			 */
33315092Sdg			s = splnet();
33420407Swollman			ifa = &ia->ia_ifa;
335108033Shsu			IFA_LOCK_INIT(ifa);
33620407Swollman			ifa->ifa_addr = (struct sockaddr *)&ia->ia_addr;
33720407Swollman			ifa->ifa_dstaddr = (struct sockaddr *)&ia->ia_dstaddr;
33820407Swollman			ifa->ifa_netmask = (struct sockaddr *)&ia->ia_sockmask;
339108033Shsu			ifa->ifa_refcnt = 1;
340108033Shsu			TAILQ_INSERT_TAIL(&ifp->if_addrhead, ifa, ifa_link);
341108033Shsu
3421541Srgrimes			ia->ia_sockmask.sin_len = 8;
34385740Sdes			ia->ia_sockmask.sin_family = AF_INET;
3441541Srgrimes			if (ifp->if_flags & IFF_BROADCAST) {
3451541Srgrimes				ia->ia_broadaddr.sin_len = sizeof(ia->ia_addr);
3461541Srgrimes				ia->ia_broadaddr.sin_family = AF_INET;
3471541Srgrimes			}
3481541Srgrimes			ia->ia_ifp = ifp;
349151824Sglebius
350181803Sbz			TAILQ_INSERT_TAIL(&V_in_ifaddrhead, ia, ia_link);
35115092Sdg			splx(s);
35287124Sbrian			iaIsNew = 1;
3531541Srgrimes		}
3541541Srgrimes		break;
3551541Srgrimes
3561541Srgrimes	case SIOCSIFBRDADDR:
357164033Srwatson		if (td != NULL) {
358164033Srwatson			error = priv_check(td, PRIV_NET_ADDIFADDR);
359164033Srwatson			if (error)
360164033Srwatson				return (error);
361164033Srwatson		}
3621541Srgrimes		/* FALLTHROUGH */
3631541Srgrimes
3641541Srgrimes	case SIOCGIFADDR:
3651541Srgrimes	case SIOCGIFNETMASK:
3661541Srgrimes	case SIOCGIFDSTADDR:
3671541Srgrimes	case SIOCGIFBRDADDR:
368184295Sbz		if (ia == NULL)
3691541Srgrimes			return (EADDRNOTAVAIL);
3701541Srgrimes		break;
3711541Srgrimes	}
3721541Srgrimes	switch (cmd) {
3731541Srgrimes
3741541Srgrimes	case SIOCGIFADDR:
3751541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_addr) = ia->ia_addr;
37687124Sbrian		return (0);
3771541Srgrimes
3781541Srgrimes	case SIOCGIFBRDADDR:
3791541Srgrimes		if ((ifp->if_flags & IFF_BROADCAST) == 0)
3801541Srgrimes			return (EINVAL);
3811541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_dstaddr) = ia->ia_broadaddr;
38287124Sbrian		return (0);
3831541Srgrimes
3841541Srgrimes	case SIOCGIFDSTADDR:
3851541Srgrimes		if ((ifp->if_flags & IFF_POINTOPOINT) == 0)
3861541Srgrimes			return (EINVAL);
3871541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_dstaddr) = ia->ia_dstaddr;
38887124Sbrian		return (0);
3891541Srgrimes
3901541Srgrimes	case SIOCGIFNETMASK:
3911541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_addr) = ia->ia_sockmask;
39287124Sbrian		return (0);
3931541Srgrimes
3941541Srgrimes	case SIOCSIFDSTADDR:
3951541Srgrimes		if ((ifp->if_flags & IFF_POINTOPOINT) == 0)
3961541Srgrimes			return (EINVAL);
3971541Srgrimes		oldaddr = ia->ia_dstaddr;
3981541Srgrimes		ia->ia_dstaddr = *(struct sockaddr_in *)&ifr->ifr_dstaddr;
399184295Sbz		if (ifp->if_ioctl != NULL) {
400146883Siedowse			error = (*ifp->if_ioctl)(ifp, SIOCSIFDSTADDR,
401146883Siedowse			    (caddr_t)ia);
402146883Siedowse			if (error) {
403146883Siedowse				ia->ia_dstaddr = oldaddr;
404146883Siedowse				return (error);
405146883Siedowse			}
4061541Srgrimes		}
4071541Srgrimes		if (ia->ia_flags & IFA_ROUTE) {
4081541Srgrimes			ia->ia_ifa.ifa_dstaddr = (struct sockaddr *)&oldaddr;
4091541Srgrimes			rtinit(&(ia->ia_ifa), (int)RTM_DELETE, RTF_HOST);
4101541Srgrimes			ia->ia_ifa.ifa_dstaddr =
4111541Srgrimes					(struct sockaddr *)&ia->ia_dstaddr;
4121541Srgrimes			rtinit(&(ia->ia_ifa), (int)RTM_ADD, RTF_HOST|RTF_UP);
4131541Srgrimes		}
41487124Sbrian		return (0);
4151541Srgrimes
4161541Srgrimes	case SIOCSIFBRDADDR:
4171541Srgrimes		if ((ifp->if_flags & IFF_BROADCAST) == 0)
4181541Srgrimes			return (EINVAL);
4191541Srgrimes		ia->ia_broadaddr = *(struct sockaddr_in *)&ifr->ifr_broadaddr;
42087124Sbrian		return (0);
4211541Srgrimes
4221541Srgrimes	case SIOCSIFADDR:
42387124Sbrian		error = in_ifinit(ifp, ia,
42487124Sbrian		    (struct sockaddr_in *) &ifr->ifr_addr, 1);
42587124Sbrian		if (error != 0 && iaIsNew)
42687124Sbrian			break;
427168032Sbms		if (error == 0) {
428189603Sbms			ii = ((struct in_ifinfo *)ifp->if_afdata[AF_INET]);
429189592Sbms			if (iaIsFirst &&
430189592Sbms			    (ifp->if_flags & IFF_MULTICAST) != 0) {
431189592Sbms				error = in_joingroup(ifp, &allhosts_addr,
432189592Sbms				    NULL, &ii->ii_allhosts);
433189592Sbms			}
434126264Smlaier			EVENTHANDLER_INVOKE(ifaddr_event, ifp);
435168032Sbms		}
43687124Sbrian		return (0);
4371541Srgrimes
4381541Srgrimes	case SIOCSIFNETMASK:
43985740Sdes		ia->ia_sockmask.sin_addr = ifra->ifra_addr.sin_addr;
44085740Sdes		ia->ia_subnetmask = ntohl(ia->ia_sockmask.sin_addr.s_addr);
44187124Sbrian		return (0);
4421541Srgrimes
4431541Srgrimes	case SIOCAIFADDR:
4441541Srgrimes		maskIsNew = 0;
4451541Srgrimes		hostIsNew = 1;
4461541Srgrimes		error = 0;
4471541Srgrimes		if (ia->ia_addr.sin_family == AF_INET) {
4481541Srgrimes			if (ifra->ifra_addr.sin_len == 0) {
4491541Srgrimes				ifra->ifra_addr = ia->ia_addr;
4501541Srgrimes				hostIsNew = 0;
4511541Srgrimes			} else if (ifra->ifra_addr.sin_addr.s_addr ==
4521541Srgrimes					       ia->ia_addr.sin_addr.s_addr)
4531541Srgrimes				hostIsNew = 0;
4541541Srgrimes		}
4551541Srgrimes		if (ifra->ifra_mask.sin_len) {
4561541Srgrimes			in_ifscrub(ifp, ia);
4571541Srgrimes			ia->ia_sockmask = ifra->ifra_mask;
45885740Sdes			ia->ia_sockmask.sin_family = AF_INET;
4591541Srgrimes			ia->ia_subnetmask =
4601541Srgrimes			     ntohl(ia->ia_sockmask.sin_addr.s_addr);
4611541Srgrimes			maskIsNew = 1;
4621541Srgrimes		}
4631541Srgrimes		if ((ifp->if_flags & IFF_POINTOPOINT) &&
4641541Srgrimes		    (ifra->ifra_dstaddr.sin_family == AF_INET)) {
4651541Srgrimes			in_ifscrub(ifp, ia);
4661541Srgrimes			ia->ia_dstaddr = ifra->ifra_dstaddr;
4671541Srgrimes			maskIsNew  = 1; /* We lie; but the effect's the same */
4681541Srgrimes		}
4691541Srgrimes		if (ifra->ifra_addr.sin_family == AF_INET &&
4701541Srgrimes		    (hostIsNew || maskIsNew))
4711541Srgrimes			error = in_ifinit(ifp, ia, &ifra->ifra_addr, 0);
47287124Sbrian		if (error != 0 && iaIsNew)
47387124Sbrian			break;
47487124Sbrian
4751541Srgrimes		if ((ifp->if_flags & IFF_BROADCAST) &&
4761541Srgrimes		    (ifra->ifra_broadaddr.sin_family == AF_INET))
4771541Srgrimes			ia->ia_broadaddr = ifra->ifra_broadaddr;
478168032Sbms		if (error == 0) {
479189603Sbms			ii = ((struct in_ifinfo *)ifp->if_afdata[AF_INET]);
480189592Sbms			if (iaIsFirst &&
481189592Sbms			    (ifp->if_flags & IFF_MULTICAST) != 0) {
482189592Sbms				error = in_joingroup(ifp, &allhosts_addr,
483189592Sbms				    NULL, &ii->ii_allhosts);
484189592Sbms			}
485126264Smlaier			EVENTHANDLER_INVOKE(ifaddr_event, ifp);
486168032Sbms		}
4871541Srgrimes		return (error);
4881541Srgrimes
4891541Srgrimes	case SIOCDIFADDR:
49074299Sru		/*
49174299Sru		 * in_ifscrub kills the interface route.
49274299Sru		 */
4931541Srgrimes		in_ifscrub(ifp, ia);
49415092Sdg		/*
49574299Sru		 * in_ifadown gets rid of all the rest of
49674299Sru		 * the routes.  This is not quite the right
49774299Sru		 * thing to do, but at least if we are running
49874299Sru		 * a routing process they will come back.
49974299Sru		 */
50076469Sru		in_ifadown(&ia->ia_ifa, 1);
501126264Smlaier		EVENTHANDLER_INVOKE(ifaddr_event, ifp);
50287124Sbrian		error = 0;
5031541Srgrimes		break;
5041541Srgrimes
5051541Srgrimes	default:
506184295Sbz		if (ifp == NULL || ifp->if_ioctl == NULL)
5071541Srgrimes			return (EOPNOTSUPP);
508189851Srwatson		return ((*ifp->if_ioctl)(ifp, cmd, data));
5091541Srgrimes	}
51087124Sbrian
51187124Sbrian	/*
51287124Sbrian	 * Protect from ipintr() traversing address list while we're modifying
51387124Sbrian	 * it.
51487124Sbrian	 */
51587124Sbrian	s = splnet();
51687124Sbrian	TAILQ_REMOVE(&ifp->if_addrhead, &ia->ia_ifa, ifa_link);
517181803Sbz	TAILQ_REMOVE(&V_in_ifaddrhead, ia, ia_link);
518168032Sbms	if (ia->ia_addr.sin_family == AF_INET) {
519154777Sandre		LIST_REMOVE(ia, ia_hash);
520168032Sbms		/*
521168032Sbms		 * If this is the last IPv4 address configured on this
522168032Sbms		 * interface, leave the all-hosts group.
523189592Sbms		 * No state-change report need be transmitted.
524168032Sbms		 */
525168032Sbms		oia = NULL;
526168032Sbms		IFP_TO_IA(ifp, oia);
527168032Sbms		if (oia == NULL) {
528189603Sbms			ii = ((struct in_ifinfo *)ifp->if_afdata[AF_INET]);
529168032Sbms			IN_MULTI_LOCK();
530189592Sbms			if (ii->ii_allhosts) {
531189592Sbms				(void)in_leavegroup_locked(ii->ii_allhosts,
532189592Sbms				    NULL);
533189592Sbms				ii->ii_allhosts = NULL;
534189592Sbms			}
535168032Sbms			IN_MULTI_UNLOCK();
536168032Sbms		}
537168032Sbms	}
53887124Sbrian	IFAFREE(&ia->ia_ifa);
53987124Sbrian	splx(s);
54087124Sbrian
54187124Sbrian	return (error);
5421541Srgrimes}
5431541Srgrimes
5441541Srgrimes/*
54555009Sshin * SIOC[GAD]LIFADDR.
54655009Sshin *	SIOCGLIFADDR: get first address. (?!?)
54755009Sshin *	SIOCGLIFADDR with IFLR_PREFIX:
54855009Sshin *		get first address that matches the specified prefix.
54955009Sshin *	SIOCALIFADDR: add the specified address.
55055009Sshin *	SIOCALIFADDR with IFLR_PREFIX:
55155009Sshin *		EINVAL since we can't deduce hostid part of the address.
55255009Sshin *	SIOCDLIFADDR: delete the specified address.
55355009Sshin *	SIOCDLIFADDR with IFLR_PREFIX:
55455009Sshin *		delete the first address that matches the specified prefix.
55555009Sshin * return values:
55655009Sshin *	EINVAL on invalid parameters
55755009Sshin *	EADDRNOTAVAIL on prefix match failed/specified address not found
55855009Sshin *	other values may be returned from in_ioctl()
55955009Sshin */
56055009Sshinstatic int
561169454Srwatsonin_lifaddr_ioctl(struct socket *so, u_long cmd, caddr_t data,
562169454Srwatson    struct ifnet *ifp, struct thread *td)
56355009Sshin{
56455009Sshin	struct if_laddrreq *iflr = (struct if_laddrreq *)data;
56555009Sshin	struct ifaddr *ifa;
56655009Sshin
56755009Sshin	/* sanity checks */
568184295Sbz	if (data == NULL || ifp == NULL) {
56955009Sshin		panic("invalid argument to in_lifaddr_ioctl");
57055009Sshin		/*NOTRECHED*/
57155009Sshin	}
57255009Sshin
57355009Sshin	switch (cmd) {
57455009Sshin	case SIOCGLIFADDR:
57555009Sshin		/* address must be specified on GET with IFLR_PREFIX */
57655009Sshin		if ((iflr->flags & IFLR_PREFIX) == 0)
57755009Sshin			break;
57855009Sshin		/*FALLTHROUGH*/
57955009Sshin	case SIOCALIFADDR:
58055009Sshin	case SIOCDLIFADDR:
58155009Sshin		/* address must be specified on ADD and DELETE */
58255917Sshin		if (iflr->addr.ss_family != AF_INET)
583184295Sbz			return (EINVAL);
58455917Sshin		if (iflr->addr.ss_len != sizeof(struct sockaddr_in))
585184295Sbz			return (EINVAL);
58655009Sshin		/* XXX need improvement */
58755917Sshin		if (iflr->dstaddr.ss_family
58855917Sshin		 && iflr->dstaddr.ss_family != AF_INET)
589184295Sbz			return (EINVAL);
59055917Sshin		if (iflr->dstaddr.ss_family
59155917Sshin		 && iflr->dstaddr.ss_len != sizeof(struct sockaddr_in))
592184295Sbz			return (EINVAL);
59355009Sshin		break;
59455009Sshin	default: /*shouldn't happen*/
595184295Sbz		return (EOPNOTSUPP);
59655009Sshin	}
59755009Sshin	if (sizeof(struct in_addr) * 8 < iflr->prefixlen)
598184295Sbz		return (EINVAL);
59955009Sshin
60055009Sshin	switch (cmd) {
60155009Sshin	case SIOCALIFADDR:
60255009Sshin	    {
60355009Sshin		struct in_aliasreq ifra;
60455009Sshin
60555009Sshin		if (iflr->flags & IFLR_PREFIX)
606184295Sbz			return (EINVAL);
60755009Sshin
60855009Sshin		/* copy args to in_aliasreq, perform ioctl(SIOCAIFADDR_IN6). */
60955009Sshin		bzero(&ifra, sizeof(ifra));
61055009Sshin		bcopy(iflr->iflr_name, ifra.ifra_name,
61155009Sshin			sizeof(ifra.ifra_name));
61255009Sshin
61355917Sshin		bcopy(&iflr->addr, &ifra.ifra_addr, iflr->addr.ss_len);
61455009Sshin
61555917Sshin		if (iflr->dstaddr.ss_family) {	/*XXX*/
61655009Sshin			bcopy(&iflr->dstaddr, &ifra.ifra_dstaddr,
61755917Sshin				iflr->dstaddr.ss_len);
61855009Sshin		}
61955009Sshin
62055009Sshin		ifra.ifra_mask.sin_family = AF_INET;
62155009Sshin		ifra.ifra_mask.sin_len = sizeof(struct sockaddr_in);
62255009Sshin		in_len2mask(&ifra.ifra_mask.sin_addr, iflr->prefixlen);
62355009Sshin
624184295Sbz		return (in_control(so, SIOCAIFADDR, (caddr_t)&ifra, ifp, td));
62555009Sshin	    }
62655009Sshin	case SIOCGLIFADDR:
62755009Sshin	case SIOCDLIFADDR:
62855009Sshin	    {
62955009Sshin		struct in_ifaddr *ia;
63055009Sshin		struct in_addr mask, candidate, match;
63155009Sshin		struct sockaddr_in *sin;
63255009Sshin
63355009Sshin		bzero(&mask, sizeof(mask));
634170855Smjacob		bzero(&match, sizeof(match));
63555009Sshin		if (iflr->flags & IFLR_PREFIX) {
63655009Sshin			/* lookup a prefix rather than address. */
63755009Sshin			in_len2mask(&mask, iflr->prefixlen);
63855009Sshin
63955009Sshin			sin = (struct sockaddr_in *)&iflr->addr;
64055009Sshin			match.s_addr = sin->sin_addr.s_addr;
64155009Sshin			match.s_addr &= mask.s_addr;
64255009Sshin
64355009Sshin			/* if you set extra bits, that's wrong */
64455009Sshin			if (match.s_addr != sin->sin_addr.s_addr)
645184295Sbz				return (EINVAL);
64655009Sshin
64755009Sshin		} else {
648170855Smjacob			/* on getting an address, take the 1st match */
649170855Smjacob			/* on deleting an address, do exact match */
650170855Smjacob			if (cmd != SIOCGLIFADDR) {
65155009Sshin				in_len2mask(&mask, 32);
65255009Sshin				sin = (struct sockaddr_in *)&iflr->addr;
65355009Sshin				match.s_addr = sin->sin_addr.s_addr;
65455009Sshin			}
65555009Sshin		}
65655009Sshin
65755009Sshin		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link)	{
65855009Sshin			if (ifa->ifa_addr->sa_family != AF_INET6)
65955009Sshin				continue;
660170855Smjacob			if (match.s_addr == 0)
66155009Sshin				break;
66255009Sshin			candidate.s_addr = ((struct sockaddr_in *)&ifa->ifa_addr)->sin_addr.s_addr;
66355009Sshin			candidate.s_addr &= mask.s_addr;
66455009Sshin			if (candidate.s_addr == match.s_addr)
66555009Sshin				break;
66655009Sshin		}
667184295Sbz		if (ifa == NULL)
668184295Sbz			return (EADDRNOTAVAIL);
66955009Sshin		ia = (struct in_ifaddr *)ifa;
67055009Sshin
67155009Sshin		if (cmd == SIOCGLIFADDR) {
67255009Sshin			/* fill in the if_laddrreq structure */
67355009Sshin			bcopy(&ia->ia_addr, &iflr->addr, ia->ia_addr.sin_len);
67455009Sshin
67555009Sshin			if ((ifp->if_flags & IFF_POINTOPOINT) != 0) {
67655009Sshin				bcopy(&ia->ia_dstaddr, &iflr->dstaddr,
67755009Sshin					ia->ia_dstaddr.sin_len);
67855009Sshin			} else
67955009Sshin				bzero(&iflr->dstaddr, sizeof(iflr->dstaddr));
68055009Sshin
68155009Sshin			iflr->prefixlen =
68255009Sshin				in_mask2len(&ia->ia_sockmask.sin_addr);
68355009Sshin
68455009Sshin			iflr->flags = 0;	/*XXX*/
68555009Sshin
686184295Sbz			return (0);
68755009Sshin		} else {
68855009Sshin			struct in_aliasreq ifra;
68955009Sshin
69055009Sshin			/* fill in_aliasreq and do ioctl(SIOCDIFADDR_IN6) */
69155009Sshin			bzero(&ifra, sizeof(ifra));
69255009Sshin			bcopy(iflr->iflr_name, ifra.ifra_name,
69355009Sshin				sizeof(ifra.ifra_name));
69455009Sshin
69555009Sshin			bcopy(&ia->ia_addr, &ifra.ifra_addr,
69655009Sshin				ia->ia_addr.sin_len);
69755009Sshin			if ((ifp->if_flags & IFF_POINTOPOINT) != 0) {
69855009Sshin				bcopy(&ia->ia_dstaddr, &ifra.ifra_dstaddr,
69955009Sshin					ia->ia_dstaddr.sin_len);
70055009Sshin			}
70155009Sshin			bcopy(&ia->ia_sockmask, &ifra.ifra_dstaddr,
70255009Sshin				ia->ia_sockmask.sin_len);
70355009Sshin
704184295Sbz			return (in_control(so, SIOCDIFADDR, (caddr_t)&ifra,
705184295Sbz			    ifp, td));
70655009Sshin		}
70755009Sshin	    }
70855009Sshin	}
70955009Sshin
710184295Sbz	return (EOPNOTSUPP);	/*just for safety*/
71155009Sshin}
71255009Sshin
/*
 * Remove whatever route currently exists for an interface address.
 *
 * The work is done by in_scrubprefix() on `ia'; its result is discarded
 * and `ifp' is not used.
 */
void
in_ifscrub(struct ifnet *ifp, struct in_ifaddr *ia)
{

	(void)in_scrubprefix(ia);
}
7221541Srgrimes
7231541Srgrimes/*
7241541Srgrimes * Initialize an interface's internet address
7251541Srgrimes * and routing table entry.
7261541Srgrimes */
72712296Sphkstatic int
728169454Srwatsonin_ifinit(struct ifnet *ifp, struct in_ifaddr *ia, struct sockaddr_in *sin,
729169454Srwatson    int scrub)
7301541Srgrimes{
731183550Szec	INIT_VNET_INET(ifp->if_vnet);
7321541Srgrimes	register u_long i = ntohl(sin->sin_addr.s_addr);
7331541Srgrimes	struct sockaddr_in oldaddr;
73494326Sbrian	int s = splimp(), flags = RTF_UP, error = 0;
7351541Srgrimes
7361541Srgrimes	oldaddr = ia->ia_addr;
737105748Ssuz	if (oldaddr.sin_family == AF_INET)
738105748Ssuz		LIST_REMOVE(ia, ia_hash);
7391541Srgrimes	ia->ia_addr = *sin;
740105748Ssuz	if (ia->ia_addr.sin_family == AF_INET)
741105748Ssuz		LIST_INSERT_HEAD(INADDR_HASH(ia->ia_addr.sin_addr.s_addr),
742105748Ssuz		    ia, ia_hash);
7431541Srgrimes	/*
7441541Srgrimes	 * Give the interface a chance to initialize
7451541Srgrimes	 * if this is its first address,
7461541Srgrimes	 * and to validate the address if necessary.
7471541Srgrimes	 */
748184295Sbz	if (ifp->if_ioctl != NULL) {
749146883Siedowse		error = (*ifp->if_ioctl)(ifp, SIOCSIFADDR, (caddr_t)ia);
750146883Siedowse		if (error) {
751146883Siedowse			splx(s);
752146883Siedowse			/* LIST_REMOVE(ia, ia_hash) is done in in_control */
753146883Siedowse			ia->ia_addr = oldaddr;
754146883Siedowse			if (ia->ia_addr.sin_family == AF_INET)
755146883Siedowse				LIST_INSERT_HEAD(INADDR_HASH(
756146883Siedowse				    ia->ia_addr.sin_addr.s_addr), ia, ia_hash);
757179971Sgonzo			else
758179971Sgonzo				/*
759179971Sgonzo				 * If oldaddr family is not AF_INET (e.g.
760179971Sgonzo				 * interface has been just created) in_control
761179971Sgonzo				 * does not call LIST_REMOVE, and we end up
762179971Sgonzo				 * with bogus ia entries in hash
763179971Sgonzo				 */
764179971Sgonzo				LIST_REMOVE(ia, ia_hash);
765146883Siedowse			return (error);
766146883Siedowse		}
7671541Srgrimes	}
7681541Srgrimes	splx(s);
7691541Srgrimes	if (scrub) {
7701541Srgrimes		ia->ia_ifa.ifa_addr = (struct sockaddr *)&oldaddr;
7711541Srgrimes		in_ifscrub(ifp, ia);
7721541Srgrimes		ia->ia_ifa.ifa_addr = (struct sockaddr *)&ia->ia_addr;
7731541Srgrimes	}
7741541Srgrimes	if (IN_CLASSA(i))
7751541Srgrimes		ia->ia_netmask = IN_CLASSA_NET;
7761541Srgrimes	else if (IN_CLASSB(i))
7771541Srgrimes		ia->ia_netmask = IN_CLASSB_NET;
7781541Srgrimes	else
7791541Srgrimes		ia->ia_netmask = IN_CLASSC_NET;
7801541Srgrimes	/*
7811541Srgrimes	 * The subnet mask usually includes at least the standard network part,
7821541Srgrimes	 * but may may be smaller in the case of supernetting.
7831541Srgrimes	 * If it is set, we believe it.
7841541Srgrimes	 */
7851541Srgrimes	if (ia->ia_subnetmask == 0) {
7861541Srgrimes		ia->ia_subnetmask = ia->ia_netmask;
7871541Srgrimes		ia->ia_sockmask.sin_addr.s_addr = htonl(ia->ia_subnetmask);
7881541Srgrimes	} else
7891541Srgrimes		ia->ia_netmask &= ia->ia_subnetmask;
7901541Srgrimes	ia->ia_net = i & ia->ia_netmask;
7911541Srgrimes	ia->ia_subnet = i & ia->ia_subnetmask;
7921541Srgrimes	in_socktrim(&ia->ia_sockmask);
793143868Sglebius#ifdef DEV_CARP
7941541Srgrimes	/*
795143868Sglebius	 * XXX: carp(4) does not have interface route
796143868Sglebius	 */
797143868Sglebius	if (ifp->if_type == IFT_CARP)
798143868Sglebius		return (0);
799143868Sglebius#endif
800143868Sglebius	/*
8011541Srgrimes	 * Add route for the network.
8021541Srgrimes	 */
8031541Srgrimes	ia->ia_ifa.ifa_metric = ifp->if_metric;
8041541Srgrimes	if (ifp->if_flags & IFF_BROADCAST) {
8051541Srgrimes		ia->ia_broadaddr.sin_addr.s_addr =
8061541Srgrimes			htonl(ia->ia_subnet | ~ia->ia_subnetmask);
8071541Srgrimes		ia->ia_netbroadcast.s_addr =
8081541Srgrimes			htonl(ia->ia_net | ~ ia->ia_netmask);
8091541Srgrimes	} else if (ifp->if_flags & IFF_LOOPBACK) {
810137833Smlaier		ia->ia_dstaddr = ia->ia_addr;
8111541Srgrimes		flags |= RTF_HOST;
8121541Srgrimes	} else if (ifp->if_flags & IFF_POINTOPOINT) {
8131541Srgrimes		if (ia->ia_dstaddr.sin_family != AF_INET)
8141541Srgrimes			return (0);
8151541Srgrimes		flags |= RTF_HOST;
8161541Srgrimes	}
817137628Smlaier	if ((error = in_addprefix(ia, flags)) != 0)
818137628Smlaier		return (error);
81994326Sbrian
8201541Srgrimes	return (error);
8211541Srgrimes}
8221541Srgrimes
/*
 * Route flags implied by the interface of in_ifaddr "x": RTF_HOST when the
 * interface has IFF_LOOPBACK or IFF_POINTOPOINT set, 0 otherwise.
 */
#define	rtinitflags(x)							\
	(((x)->ia_ifp->if_flags & (IFF_LOOPBACK | IFF_POINTOPOINT)) ?	\
	    RTF_HOST : 0)
826137628Smlaier/*
827170855Smjacob * Check if we have a route for the given prefix already or add one accordingly.
828137628Smlaier */
829137628Smlaierstatic int
830169454Srwatsonin_addprefix(struct in_ifaddr *target, int flags)
831137628Smlaier{
832183550Szec	INIT_VNET_INET(curvnet);
833137628Smlaier	struct in_ifaddr *ia;
834151555Sglebius	struct in_addr prefix, mask, p, m;
835137628Smlaier	int error;
8361541Srgrimes
837170855Smjacob	if ((flags & RTF_HOST) != 0) {
838137628Smlaier		prefix = target->ia_dstaddr.sin_addr;
839170855Smjacob		mask.s_addr = 0;
840170855Smjacob	} else {
841137628Smlaier		prefix = target->ia_addr.sin_addr;
842137628Smlaier		mask = target->ia_sockmask.sin_addr;
843137628Smlaier		prefix.s_addr &= mask.s_addr;
844137628Smlaier	}
845137628Smlaier
846181803Sbz	TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link) {
847151555Sglebius		if (rtinitflags(ia)) {
848137628Smlaier			p = ia->ia_addr.sin_addr;
849151555Sglebius
850151555Sglebius			if (prefix.s_addr != p.s_addr)
851151555Sglebius				continue;
852151555Sglebius		} else {
853151555Sglebius			p = ia->ia_addr.sin_addr;
854151555Sglebius			m = ia->ia_sockmask.sin_addr;
855151555Sglebius			p.s_addr &= m.s_addr;
856151555Sglebius
857151555Sglebius			if (prefix.s_addr != p.s_addr ||
858151555Sglebius			    mask.s_addr != m.s_addr)
859151555Sglebius				continue;
860137628Smlaier		}
861137628Smlaier
862137628Smlaier		/*
863137628Smlaier		 * If we got a matching prefix route inserted by other
864137628Smlaier		 * interface address, we are done here.
865137628Smlaier		 */
866149221Sglebius		if (ia->ia_flags & IFA_ROUTE) {
867181803Sbz			if (V_sameprefixcarponly &&
868149221Sglebius			    target->ia_ifp->if_type != IFT_CARP &&
869149221Sglebius			    ia->ia_ifp->if_type != IFT_CARP)
870149221Sglebius				return (EEXIST);
871149221Sglebius			else
872149221Sglebius				return (0);
873149221Sglebius		}
874137628Smlaier	}
875137628Smlaier
876137628Smlaier	/*
877137628Smlaier	 * No-one seem to have this prefix route, so we try to insert it.
878137628Smlaier	 */
879137628Smlaier	error = rtinit(&target->ia_ifa, (int)RTM_ADD, flags);
880137628Smlaier	if (!error)
881137628Smlaier		target->ia_flags |= IFA_ROUTE;
882184295Sbz	return (error);
883137628Smlaier}
884137628Smlaier
885186119Sqingliextern void arp_ifscrub(struct ifnet *ifp, uint32_t addr);
886186119Sqingli
8871541Srgrimes/*
888137628Smlaier * If there is no other address in the system that can serve a route to the
889137628Smlaier * same prefix, remove the route.  Hand over the route to the new address
890137628Smlaier * otherwise.
891137628Smlaier */
892137628Smlaierstatic int
893169454Srwatsonin_scrubprefix(struct in_ifaddr *target)
894137628Smlaier{
895183550Szec	INIT_VNET_INET(curvnet);
896137628Smlaier	struct in_ifaddr *ia;
897137628Smlaier	struct in_addr prefix, mask, p;
898137628Smlaier	int error;
899137628Smlaier
900137628Smlaier	if ((target->ia_flags & IFA_ROUTE) == 0)
901184295Sbz		return (0);
902137628Smlaier
903137628Smlaier	if (rtinitflags(target))
904137628Smlaier		prefix = target->ia_dstaddr.sin_addr;
905137628Smlaier	else {
906137628Smlaier		prefix = target->ia_addr.sin_addr;
907137628Smlaier		mask = target->ia_sockmask.sin_addr;
908137628Smlaier		prefix.s_addr &= mask.s_addr;
909186119Sqingli		/* remove arp cache */
910186119Sqingli		arp_ifscrub(target->ia_ifp, IA_SIN(target)->sin_addr.s_addr);
911137628Smlaier	}
912137628Smlaier
913181803Sbz	TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link) {
914137628Smlaier		if (rtinitflags(ia))
915137628Smlaier			p = ia->ia_dstaddr.sin_addr;
916137628Smlaier		else {
917137628Smlaier			p = ia->ia_addr.sin_addr;
918137628Smlaier			p.s_addr &= ia->ia_sockmask.sin_addr.s_addr;
919137628Smlaier		}
920137628Smlaier
921137628Smlaier		if (prefix.s_addr != p.s_addr)
922137628Smlaier			continue;
923137628Smlaier
924137628Smlaier		/*
925137628Smlaier		 * If we got a matching prefix address, move IFA_ROUTE and
926137628Smlaier		 * the route itself to it.  Make sure that routing daemons
927137628Smlaier		 * get a heads-up.
928143868Sglebius		 *
929143868Sglebius		 * XXX: a special case for carp(4) interface
930137628Smlaier		 */
931143868Sglebius		if ((ia->ia_flags & IFA_ROUTE) == 0
932143868Sglebius#ifdef DEV_CARP
933143868Sglebius		    && (ia->ia_ifp->if_type != IFT_CARP)
934143868Sglebius#endif
935143868Sglebius							) {
936137628Smlaier			rtinit(&(target->ia_ifa), (int)RTM_DELETE,
937137628Smlaier			    rtinitflags(target));
938137628Smlaier			target->ia_flags &= ~IFA_ROUTE;
939137628Smlaier
940137628Smlaier			error = rtinit(&ia->ia_ifa, (int)RTM_ADD,
941137628Smlaier			    rtinitflags(ia) | RTF_UP);
942137628Smlaier			if (error == 0)
943137628Smlaier				ia->ia_flags |= IFA_ROUTE;
944184295Sbz			return (error);
945137628Smlaier		}
946137628Smlaier	}
947137628Smlaier
948137628Smlaier	/*
949137628Smlaier	 * As no-one seem to have this prefix, we can remove the route.
950137628Smlaier	 */
951137628Smlaier	rtinit(&(target->ia_ifa), (int)RTM_DELETE, rtinitflags(target));
952137628Smlaier	target->ia_flags &= ~IFA_ROUTE;
953184295Sbz	return (0);
954137628Smlaier}
955137628Smlaier
956137628Smlaier#undef rtinitflags
957137628Smlaier
958137628Smlaier/*
9591541Srgrimes * Return 1 if the address might be a local broadcast address.
9601541Srgrimes */
9611549Srgrimesint
962169454Srwatsonin_broadcast(struct in_addr in, struct ifnet *ifp)
9631541Srgrimes{
9641541Srgrimes	register struct ifaddr *ifa;
9651541Srgrimes	u_long t;
9661541Srgrimes
9671541Srgrimes	if (in.s_addr == INADDR_BROADCAST ||
9681541Srgrimes	    in.s_addr == INADDR_ANY)
969184295Sbz		return (1);
9701541Srgrimes	if ((ifp->if_flags & IFF_BROADCAST) == 0)
971184295Sbz		return (0);
9721541Srgrimes	t = ntohl(in.s_addr);
9731541Srgrimes	/*
9741541Srgrimes	 * Look through the list of addresses for a match
9751541Srgrimes	 * with a broadcast address.
9761541Srgrimes	 */
9771541Srgrimes#define ia ((struct in_ifaddr *)ifa)
97874362Sphk	TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link)
9791541Srgrimes		if (ifa->ifa_addr->sa_family == AF_INET &&
9801541Srgrimes		    (in.s_addr == ia->ia_broadaddr.sin_addr.s_addr ||
9811541Srgrimes		     in.s_addr == ia->ia_netbroadcast.s_addr ||
9821541Srgrimes		     /*
9831541Srgrimes		      * Check for old-style (host 0) broadcast.
9841541Srgrimes		      */
98513351Sguido		     t == ia->ia_subnet || t == ia->ia_net) &&
98613351Sguido		     /*
98713351Sguido		      * Check for an all one subnetmask. These
98813351Sguido		      * only exist when an interface gets a secondary
98913351Sguido		      * address.
99013351Sguido		      */
99113351Sguido		     ia->ia_subnetmask != (u_long)0xffffffff)
992184295Sbz			    return (1);
9931541Srgrimes	return (0);
9941541Srgrimes#undef ia
9951541Srgrimes}
996167729Sbms
9971541Srgrimes/*
998189592Sbms * On interface removal, clean up IPv4 data structures hung off of the ifnet.
999189592Sbms */
1000189592Sbmsvoid
1001189592Sbmsin_ifdetach(struct ifnet *ifp)
1002189592Sbms{
1003189592Sbms	INIT_VNET_INET(ifp->if_vnet);
1004189592Sbms
1005189592Sbms	in_pcbpurgeif0(&V_ripcbinfo, ifp);
1006189592Sbms	in_pcbpurgeif0(&V_udbinfo, ifp);
1007189592Sbms	in_purgemaddrs(ifp);
1008189592Sbms}
1009189592Sbms
1010189592Sbms/*
1011167729Sbms * Delete all IPv4 multicast address records, and associated link-layer
1012167729Sbms * multicast address records, associated with ifp.
1013189592Sbms * XXX It looks like domifdetach runs AFTER the link layer cleanup.
1014189931Sbms * XXX This should not race with ifma_protospec being set during
1015189931Sbms * a new allocation, if it does, we have bigger problems.
1016162718Sbms */
1017167729Sbmsstatic void
1018167729Sbmsin_purgemaddrs(struct ifnet *ifp)
1019162718Sbms{
1020183550Szec	INIT_VNET_INET(ifp->if_vnet);
1021189592Sbms	LIST_HEAD(,in_multi) purgeinms;
1022189592Sbms	struct in_multi		*inm, *tinm;
1023189592Sbms	struct ifmultiaddr	*ifma;
1024162718Sbms
1025189592Sbms	LIST_INIT(&purgeinms);
1026162718Sbms	IN_MULTI_LOCK();
1027189592Sbms
1028189592Sbms	/*
1029189592Sbms	 * Extract list of in_multi associated with the detaching ifp
1030189592Sbms	 * which the PF_INET layer is about to release.
1031189592Sbms	 * We need to do this as IF_ADDR_LOCK() may be re-acquired
1032189592Sbms	 * by code further down.
1033189592Sbms	 */
1034189592Sbms	IF_ADDR_LOCK(ifp);
1035189592Sbms	TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) {
1036189931Sbms		if (ifma->ifma_addr->sa_family != AF_INET ||
1037189931Sbms		    ifma->ifma_protospec == NULL)
1038189592Sbms			continue;
1039189931Sbms#if 0
1040189931Sbms		KASSERT(ifma->ifma_protospec != NULL,
1041189931Sbms		    ("%s: ifma_protospec is NULL", __func__));
1042189931Sbms#endif
1043189592Sbms		inm = (struct in_multi *)ifma->ifma_protospec;
1044189592Sbms		LIST_INSERT_HEAD(&purgeinms, inm, inm_link);
1045162718Sbms	}
1046189592Sbms	IF_ADDR_UNLOCK(ifp);
1047150296Srwatson
1048189592Sbms	LIST_FOREACH_SAFE(inm, &purgeinms, inm_link, tinm) {
1049189592Sbms		inm_release_locked(inm);
1050189592Sbms		LIST_REMOVE(inm, inm_link);
1051189592Sbms	}
1052189592Sbms	igmp_ifdetach(ifp);
1053150296Srwatson
1054189592Sbms	IN_MULTI_UNLOCK();
1055150296Srwatson}
1056186119Sqingli
1057186119Sqingli#include <sys/syslog.h>
1058186119Sqingli#include <net/if_dl.h>
1059186119Sqingli#include <netinet/if_ether.h>
1060186119Sqingli
1061186119Sqinglistruct in_llentry {
1062186119Sqingli	struct llentry		base;
1063186119Sqingli	struct sockaddr_in	l3_addr4;
1064186119Sqingli};
1065186119Sqingli
1066186119Sqinglistatic struct llentry *
1067186119Sqingliin_lltable_new(const struct sockaddr *l3addr, u_int flags)
1068186119Sqingli{
1069186119Sqingli	struct in_llentry *lle;
1070186119Sqingli
1071186119Sqingli	lle = malloc(sizeof(struct in_llentry), M_LLTABLE, M_DONTWAIT | M_ZERO);
1072186119Sqingli	if (lle == NULL)		/* NB: caller generates msg */
1073186119Sqingli		return NULL;
1074186119Sqingli
1075186119Sqingli	callout_init(&lle->base.la_timer, CALLOUT_MPSAFE);
1076186119Sqingli	/*
1077186119Sqingli	 * For IPv4 this will trigger "arpresolve" to generate
1078186119Sqingli	 * an ARP request.
1079186119Sqingli	 */
1080186119Sqingli	lle->base.la_expire = time_second; /* mark expired */
1081186119Sqingli	lle->l3_addr4 = *(const struct sockaddr_in *)l3addr;
1082186119Sqingli	lle->base.lle_refcnt = 1;
1083186119Sqingli	LLE_LOCK_INIT(&lle->base);
1084186119Sqingli	return &lle->base;
1085186119Sqingli}
1086186119Sqingli
1087186119Sqingli/*
1088186119Sqingli * Deletes an address from the address table.
1089186119Sqingli * This function is called by the timer functions
1090186119Sqingli * such as arptimer() and nd6_llinfo_timer(), and
1091186119Sqingli * the caller does the locking.
1092186119Sqingli */
1093186119Sqinglistatic void
1094186119Sqingliin_lltable_free(struct lltable *llt, struct llentry *lle)
1095186119Sqingli{
1096186150Skmacy	LLE_WUNLOCK(lle);
1097186150Skmacy	LLE_LOCK_DESTROY(lle);
1098186119Sqingli	free(lle, M_LLTABLE);
1099186119Sqingli}
1100186119Sqingli
1101186119Sqinglistatic int
1102186119Sqingliin_lltable_rtcheck(struct ifnet *ifp, const struct sockaddr *l3addr)
1103186119Sqingli{
1104186119Sqingli	struct rtentry *rt;
1105186119Sqingli
1106186119Sqingli	KASSERT(l3addr->sa_family == AF_INET,
1107186119Sqingli	    ("sin_family %d", l3addr->sa_family));
1108186119Sqingli
1109186119Sqingli	/* XXX rtalloc1 should take a const param */
1110186119Sqingli	rt = rtalloc1(__DECONST(struct sockaddr *, l3addr), 0, 0);
1111186119Sqingli	if (rt == NULL || (rt->rt_flags & RTF_GATEWAY) || rt->rt_ifp != ifp) {
1112186119Sqingli		log(LOG_INFO, "IPv4 address: \"%s\" is not on the network\n",
1113186119Sqingli		    inet_ntoa(((const struct sockaddr_in *)l3addr)->sin_addr));
1114186119Sqingli		if (rt != NULL)
1115186119Sqingli			RTFREE_LOCKED(rt);
1116186119Sqingli		return (EINVAL);
1117186119Sqingli	}
1118186119Sqingli	RTFREE_LOCKED(rt);
1119186119Sqingli	return 0;
1120186119Sqingli}
1121186119Sqingli
1122186119Sqingli/*
1123186119Sqingli * Return NULL if not found or marked for deletion.
1124186119Sqingli * If found return lle read locked.
1125186119Sqingli */
1126186119Sqinglistatic struct llentry *
1127186119Sqingliin_lltable_lookup(struct lltable *llt, u_int flags, const struct sockaddr *l3addr)
1128186119Sqingli{
1129186119Sqingli	const struct sockaddr_in *sin = (const struct sockaddr_in *)l3addr;
1130186119Sqingli	struct ifnet *ifp = llt->llt_ifp;
1131186119Sqingli	struct llentry *lle;
1132186119Sqingli	struct llentries *lleh;
1133186119Sqingli	u_int hashkey;
1134186119Sqingli
1135186119Sqingli	IF_AFDATA_LOCK_ASSERT(ifp);
1136186119Sqingli	KASSERT(l3addr->sa_family == AF_INET,
1137186119Sqingli	    ("sin_family %d", l3addr->sa_family));
1138186119Sqingli
1139186119Sqingli	hashkey = sin->sin_addr.s_addr;
1140186119Sqingli	lleh = &llt->lle_head[LLATBL_HASH(hashkey, LLTBL_HASHMASK)];
1141186119Sqingli	LIST_FOREACH(lle, lleh, lle_next) {
1142186708Sqingli		struct sockaddr_in *sa2 = (struct sockaddr_in *)L3_ADDR(lle);
1143186119Sqingli		if (lle->la_flags & LLE_DELETED)
1144186119Sqingli			continue;
1145186708Sqingli		if (sa2->sin_addr.s_addr == sin->sin_addr.s_addr)
1146186119Sqingli			break;
1147186119Sqingli	}
1148186119Sqingli	if (lle == NULL) {
1149186119Sqingli#ifdef DIAGNOSTICS
1150186119Sqingli		if (flags & LLE_DELETE)
1151186119Sqingli			log(LOG_INFO, "interface address is missing from cache = %p  in delete\n", lle);
1152186119Sqingli#endif
1153186119Sqingli		if (!(flags & LLE_CREATE))
1154186119Sqingli			return (NULL);
1155186119Sqingli		/*
1156186119Sqingli		 * A route that covers the given address must have
1157186119Sqingli		 * been installed 1st because we are doing a resolution,
1158186119Sqingli		 * verify this.
1159186119Sqingli		 */
1160186119Sqingli		if (!(flags & LLE_IFADDR) &&
1161186119Sqingli		    in_lltable_rtcheck(ifp, l3addr) != 0)
1162186119Sqingli			goto done;
1163186119Sqingli
1164186119Sqingli		lle = in_lltable_new(l3addr, flags);
1165186119Sqingli		if (lle == NULL) {
1166186119Sqingli			log(LOG_INFO, "lla_lookup: new lle malloc failed\n");
1167186119Sqingli			goto done;
1168186119Sqingli		}
1169186119Sqingli		lle->la_flags = flags & ~LLE_CREATE;
1170186119Sqingli		if ((flags & (LLE_CREATE | LLE_IFADDR)) == (LLE_CREATE | LLE_IFADDR)) {
1171186119Sqingli			bcopy(IF_LLADDR(ifp), &lle->ll_addr, ifp->if_addrlen);
1172186119Sqingli			lle->la_flags |= (LLE_VALID | LLE_STATIC);
1173186119Sqingli		}
1174186119Sqingli
1175186119Sqingli		lle->lle_tbl  = llt;
1176186119Sqingli		lle->lle_head = lleh;
1177186119Sqingli		LIST_INSERT_HEAD(lleh, lle, lle_next);
1178186119Sqingli	} else if (flags & LLE_DELETE) {
1179186119Sqingli		if (!(lle->la_flags & LLE_IFADDR) || (flags & LLE_IFADDR)) {
1180186119Sqingli			LLE_WLOCK(lle);
1181186119Sqingli			lle->la_flags = LLE_DELETED;
1182186119Sqingli			LLE_WUNLOCK(lle);
1183186119Sqingli#ifdef DIAGNOSTICS
1184186119Sqingli			log(LOG_INFO, "ifaddr cache = %p  is deleted\n", lle);
1185186119Sqingli#endif
1186186119Sqingli		}
1187186119Sqingli		lle = (void *)-1;
1188186119Sqingli
1189186119Sqingli	}
1190186544Sbz	if (LLE_IS_VALID(lle)) {
1191186119Sqingli		if (flags & LLE_EXCLUSIVE)
1192186119Sqingli			LLE_WLOCK(lle);
1193186119Sqingli		else
1194186119Sqingli			LLE_RLOCK(lle);
1195186119Sqingli	}
1196186119Sqinglidone:
1197186119Sqingli	return (lle);
1198186119Sqingli}
1199186119Sqingli
1200186119Sqinglistatic int
1201186119Sqingliin_lltable_dump(struct lltable *llt, struct sysctl_req *wr)
1202186119Sqingli{
1203186119Sqingli#define	SIN(lle)	((struct sockaddr_in *) L3_ADDR(lle))
1204186119Sqingli	struct ifnet *ifp = llt->llt_ifp;
1205186119Sqingli	struct llentry *lle;
1206186119Sqingli	/* XXX stack use */
1207186119Sqingli	struct {
1208186119Sqingli		struct rt_msghdr	rtm;
1209186119Sqingli		struct sockaddr_inarp	sin;
1210186119Sqingli		struct sockaddr_dl	sdl;
1211186119Sqingli	} arpc;
1212186119Sqingli	int error, i;
1213186119Sqingli
1214186119Sqingli	/* XXXXX
1215186119Sqingli	 * current IFNET_RLOCK() is mapped to IFNET_WLOCK()
1216186119Sqingli	 * so it is okay to use this ASSERT, change it when
1217186119Sqingli	 * IFNET lock is finalized
1218186119Sqingli	 */
1219186119Sqingli	IFNET_WLOCK_ASSERT();
1220186119Sqingli
1221186119Sqingli	error = 0;
1222186119Sqingli	for (i = 0; i < LLTBL_HASHTBL_SIZE; i++) {
1223186119Sqingli		LIST_FOREACH(lle, &llt->lle_head[i], lle_next) {
1224186119Sqingli			struct sockaddr_dl *sdl;
1225186119Sqingli
1226186119Sqingli			/* skip deleted entries */
1227186119Sqingli			if ((lle->la_flags & (LLE_DELETED|LLE_VALID)) != LLE_VALID)
1228186119Sqingli				continue;
1229186980Sbz			/* Skip if jailed and not a valid IP of the prison. */
1230188144Sjamie			if (prison_if(wr->td->td_ucred, L3_ADDR(lle)) != 0)
1231186980Sbz				continue;
1232186119Sqingli			/*
1233186119Sqingli			 * produce a msg made of:
1234186119Sqingli			 *  struct rt_msghdr;
1235186119Sqingli			 *  struct sockaddr_inarp; (IPv4)
1236186119Sqingli			 *  struct sockaddr_dl;
1237186119Sqingli			 */
1238186119Sqingli			bzero(&arpc, sizeof(arpc));
1239186119Sqingli			arpc.rtm.rtm_msglen = sizeof(arpc);
1240186935Sharti			arpc.rtm.rtm_version = RTM_VERSION;
1241186935Sharti			arpc.rtm.rtm_type = RTM_GET;
1242186935Sharti			arpc.rtm.rtm_flags = RTF_UP;
1243186935Sharti			arpc.rtm.rtm_addrs = RTA_DST | RTA_GATEWAY;
1244186119Sqingli			arpc.sin.sin_family = AF_INET;
1245186119Sqingli			arpc.sin.sin_len = sizeof(arpc.sin);
1246186119Sqingli			arpc.sin.sin_addr.s_addr = SIN(lle)->sin_addr.s_addr;
1247186119Sqingli
1248186119Sqingli			/* publish */
1249186119Sqingli			if (lle->la_flags & LLE_PUB) {
1250186119Sqingli				arpc.rtm.rtm_flags |= RTF_ANNOUNCE;
1251186119Sqingli				/* proxy only */
1252186119Sqingli				if (lle->la_flags & LLE_PROXY)
1253186119Sqingli					arpc.sin.sin_other = SIN_PROXY;
1254186119Sqingli			}
1255186119Sqingli
1256186119Sqingli			sdl = &arpc.sdl;
1257186119Sqingli			sdl->sdl_family = AF_LINK;
1258186119Sqingli			sdl->sdl_len = sizeof(*sdl);
1259186119Sqingli			sdl->sdl_alen = ifp->if_addrlen;
1260186119Sqingli			sdl->sdl_index = ifp->if_index;
1261186119Sqingli			sdl->sdl_type = ifp->if_type;
1262186119Sqingli			bcopy(&lle->ll_addr, LLADDR(sdl), ifp->if_addrlen);
1263186119Sqingli
1264186119Sqingli			arpc.rtm.rtm_rmx.rmx_expire =
1265186119Sqingli			    lle->la_flags & LLE_STATIC ? 0 : lle->la_expire;
1266186500Sqingli			arpc.rtm.rtm_flags |= (RTF_HOST | RTF_LLDATA);
1267186119Sqingli			if (lle->la_flags & LLE_STATIC)
1268186119Sqingli				arpc.rtm.rtm_flags |= RTF_STATIC;
1269186119Sqingli			arpc.rtm.rtm_index = ifp->if_index;
1270186119Sqingli			error = SYSCTL_OUT(wr, &arpc, sizeof(arpc));
1271186119Sqingli			if (error)
1272186119Sqingli				break;
1273186119Sqingli		}
1274186119Sqingli	}
1275186119Sqingli	return error;
1276186119Sqingli#undef SIN
1277186119Sqingli}
1278186119Sqingli
1279186119Sqinglivoid *
1280186119Sqingliin_domifattach(struct ifnet *ifp)
1281189592Sbms{
1282189592Sbms	struct in_ifinfo *ii;
1283189592Sbms	struct lltable *llt;
1284189592Sbms
1285189592Sbms	ii = malloc(sizeof(struct in_ifinfo), M_IFADDR, M_WAITOK|M_ZERO);
1286189592Sbms
1287189592Sbms	llt = lltable_init(ifp, AF_INET);
1288186119Sqingli	if (llt != NULL) {
1289186119Sqingli		llt->llt_new = in_lltable_new;
1290186119Sqingli		llt->llt_free = in_lltable_free;
1291186119Sqingli		llt->llt_rtcheck = in_lltable_rtcheck;
1292186119Sqingli		llt->llt_lookup = in_lltable_lookup;
1293186119Sqingli		llt->llt_dump = in_lltable_dump;
1294186119Sqingli	}
1295189592Sbms	ii->ii_llt = llt;
1296189592Sbms
1297189592Sbms	ii->ii_igmp = igmp_domifattach(ifp);
1298189592Sbms
1299189592Sbms	return ii;
1300186119Sqingli}
1301186119Sqingli
1302186119Sqinglivoid
1303189592Sbmsin_domifdetach(struct ifnet *ifp, void *aux)
1304186119Sqingli{
1305189592Sbms	struct in_ifinfo *ii = (struct in_ifinfo *)aux;
1306186119Sqingli
1307189592Sbms	igmp_domifdetach(ifp);
1308189592Sbms	lltable_free(ii->ii_llt);
1309189592Sbms	free(ii, M_IFADDR);
1310186119Sqingli}
1311