in.c revision 188144
1139823Simp/*-
21541Srgrimes * Copyright (c) 1982, 1986, 1991, 1993
31541Srgrimes *	The Regents of the University of California.  All rights reserved.
4137668Smlaier * Copyright (C) 2001 WIDE Project.  All rights reserved.
51541Srgrimes *
61541Srgrimes * Redistribution and use in source and binary forms, with or without
71541Srgrimes * modification, are permitted provided that the following conditions
81541Srgrimes * are met:
91541Srgrimes * 1. Redistributions of source code must retain the above copyright
101541Srgrimes *    notice, this list of conditions and the following disclaimer.
111541Srgrimes * 2. Redistributions in binary form must reproduce the above copyright
121541Srgrimes *    notice, this list of conditions and the following disclaimer in the
131541Srgrimes *    documentation and/or other materials provided with the distribution.
141541Srgrimes * 4. Neither the name of the University nor the names of its contributors
151541Srgrimes *    may be used to endorse or promote products derived from this software
161541Srgrimes *    without specific prior written permission.
171541Srgrimes *
181541Srgrimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
191541Srgrimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
201541Srgrimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
211541Srgrimes * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
221541Srgrimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
231541Srgrimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
241541Srgrimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
251541Srgrimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
261541Srgrimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
271541Srgrimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
281541Srgrimes * SUCH DAMAGE.
291541Srgrimes *
3010939Swollman *	@(#)in.c	8.4 (Berkeley) 1/9/95
311541Srgrimes */
321541Srgrimes
33172467Ssilby#include <sys/cdefs.h>
34172467Ssilby__FBSDID("$FreeBSD: head/sys/netinet/in.c 188144 2009-02-05 14:06:09Z jamie $");
35172467Ssilby
36143868Sglebius#include "opt_carp.h"
37143868Sglebius
381541Srgrimes#include <sys/param.h>
391549Srgrimes#include <sys/systm.h>
4024204Sbde#include <sys/sockio.h>
411541Srgrimes#include <sys/malloc.h>
42164033Srwatson#include <sys/priv.h>
431541Srgrimes#include <sys/socket.h>
44186948Sbz#include <sys/jail.h>
4512704Sphk#include <sys/kernel.h>
46186948Sbz#include <sys/proc.h>
4712704Sphk#include <sys/sysctl.h>
48181803Sbz#include <sys/vimage.h>
491541Srgrimes
501541Srgrimes#include <net/if.h>
51186119Sqingli#include <net/if_llatbl.h>
5255009Sshin#include <net/if_types.h>
531541Srgrimes#include <net/route.h>
541541Srgrimes
551541Srgrimes#include <netinet/in.h>
561541Srgrimes#include <netinet/in_var.h>
5781127Sume#include <netinet/in_pcb.h>
58170613Sbms#include <netinet/ip_var.h>
59185571Sbz#include <netinet/vinet.h>
601541Srgrimes
6192723Salfredstatic int in_mask2len(struct in_addr *);
6292723Salfredstatic void in_len2mask(struct in_addr *, int);
6392723Salfredstatic int in_lifaddr_ioctl(struct socket *, u_long, caddr_t,
6492723Salfred	struct ifnet *, struct thread *);
6555009Sshin
66137628Smlaierstatic int	in_addprefix(struct in_ifaddr *, int);
67137628Smlaierstatic int	in_scrubprefix(struct in_ifaddr *);
6892723Salfredstatic void	in_socktrim(struct sockaddr_in *);
6992723Salfredstatic int	in_ifinit(struct ifnet *,
7092723Salfred	    struct in_ifaddr *, struct sockaddr_in *, int);
71167729Sbmsstatic void	in_purgemaddrs(struct ifnet *);
721541Srgrimes
73185088Szec#ifdef VIMAGE_GLOBALS
74185088Szecstatic int subnetsarelocal;
75185088Szecstatic int sameprefixcarponly;
76185088Szecextern struct inpcbinfo ripcbinfo;
77185088Szec#endif
78185088Szec
79183550SzecSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_ip, OID_AUTO, subnets_are_local,
80183550Szec	CTLFLAG_RW, subnetsarelocal, 0,
81183550Szec	"Treat all subnets as directly connected");
82183550SzecSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_ip, OID_AUTO, same_prefix_carp_only,
83183550Szec	CTLFLAG_RW, sameprefixcarponly, 0,
84149221Sglebius	"Refuse to create same prefixes on different interfaces");
8521666Swollman
861541Srgrimes/*
871541Srgrimes * Return 1 if an internet address is for a ``local'' host
881541Srgrimes * (one to which we have a connection).  If subnetsarelocal
891541Srgrimes * is true, this includes other subnets of the local net.
901541Srgrimes * Otherwise, it includes only the directly-connected (sub)nets.
911541Srgrimes */
921549Srgrimesint
93169454Srwatsonin_localaddr(struct in_addr in)
941541Srgrimes{
95183550Szec	INIT_VNET_INET(curvnet);
961541Srgrimes	register u_long i = ntohl(in.s_addr);
971541Srgrimes	register struct in_ifaddr *ia;
981541Srgrimes
99181803Sbz	if (V_subnetsarelocal) {
100181803Sbz		TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link)
1011541Srgrimes			if ((i & ia->ia_netmask) == ia->ia_net)
1021541Srgrimes				return (1);
1031541Srgrimes	} else {
104181803Sbz		TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link)
1051541Srgrimes			if ((i & ia->ia_subnetmask) == ia->ia_subnet)
1061541Srgrimes				return (1);
1071541Srgrimes	}
1081541Srgrimes	return (0);
1091541Srgrimes}
1101541Srgrimes
1111541Srgrimes/*
112133486Sandre * Return 1 if an internet address is for the local host and configured
113133486Sandre * on one of its interfaces.
114133486Sandre */
115133486Sandreint
116169454Srwatsonin_localip(struct in_addr in)
117133486Sandre{
118183550Szec	INIT_VNET_INET(curvnet);
119133486Sandre	struct in_ifaddr *ia;
120133486Sandre
121133486Sandre	LIST_FOREACH(ia, INADDR_HASH(in.s_addr), ia_hash) {
122133486Sandre		if (IA_SIN(ia)->sin_addr.s_addr == in.s_addr)
123184295Sbz			return (1);
124133486Sandre	}
125184295Sbz	return (0);
126133486Sandre}
127133486Sandre
128133486Sandre/*
1291541Srgrimes * Determine whether an IP address is in a reserved set of addresses
1301541Srgrimes * that may not be forwarded, or whether datagrams to that destination
1311541Srgrimes * may be forwarded.
1321541Srgrimes */
1331549Srgrimesint
134169454Srwatsonin_canforward(struct in_addr in)
1351541Srgrimes{
1361541Srgrimes	register u_long i = ntohl(in.s_addr);
1371541Srgrimes	register u_long net;
1381541Srgrimes
139166450Sbms	if (IN_EXPERIMENTAL(i) || IN_MULTICAST(i) || IN_LINKLOCAL(i))
1401541Srgrimes		return (0);
1411541Srgrimes	if (IN_CLASSA(i)) {
1421541Srgrimes		net = i & IN_CLASSA_NET;
1431541Srgrimes		if (net == 0 || net == (IN_LOOPBACKNET << IN_CLASSA_NSHIFT))
1441541Srgrimes			return (0);
1451541Srgrimes	}
1461541Srgrimes	return (1);
1471541Srgrimes}
1481541Srgrimes
1491541Srgrimes/*
1501541Srgrimes * Trim a mask in a sockaddr
1511541Srgrimes */
15212296Sphkstatic void
153169454Srwatsonin_socktrim(struct sockaddr_in *ap)
1541541Srgrimes{
1551541Srgrimes    register char *cplim = (char *) &ap->sin_addr;
1561541Srgrimes    register char *cp = (char *) (&ap->sin_addr + 1);
1571541Srgrimes
1581541Srgrimes    ap->sin_len = 0;
1594127Swollman    while (--cp >= cplim)
160133874Srwatson	if (*cp) {
1611541Srgrimes	    (ap)->sin_len = cp - (char *) (ap) + 1;
1621541Srgrimes	    break;
1631541Srgrimes	}
1641541Srgrimes}
1651541Srgrimes
/*
 * Convert a netmask to a prefix length.
 *
 * Counts the leading 0xff bytes of the mask (in memory order), then the
 * leading one bits of the first byte that is not 0xff.  Any bits after the
 * first zero bit are ignored, so a non-contiguous mask yields the length
 * of its leading run of ones.
 *
 * Returns a value in the range 0..32.
 */
static int
in_mask2len(struct in_addr *mask)
{
	const unsigned char *p = (const unsigned char *)mask;
	const int nbytes = (int)sizeof(*mask);
	int x, y;

	/* Whole bytes that are entirely ones. */
	for (x = 0; x < nbytes; x++) {
		if (p[x] != 0xff)
			break;
	}

	/* Leading one bits of the first partial byte, if there is one. */
	y = 0;
	if (x < nbytes) {
		for (y = 0; y < 8; y++) {
			if ((p[x] & (0x80 >> y)) == 0)
				break;
		}
	}
	return (x * 8 + y);
}
18755009Sshin
/*
 * Build a netmask from a prefix length.
 *
 * The mask is written in memory order: the first len / 8 bytes are set to
 * 0xff and, if len is not a multiple of 8, the next byte gets its top
 * len % 8 bits set.  All remaining bytes are zero.
 *
 * A length outside 0..32 is clamped to that range so that the function can
 * never write past the end of *mask or shift by a negative count.
 */
static void
in_len2mask(struct in_addr *mask, int len)
{
	const int maxlen = (int)(sizeof(*mask) * 8);
	unsigned char *p = (unsigned char *)mask;
	int i;

	bzero(mask, sizeof(*mask));
	if (len <= 0)
		return;
	if (len > maxlen)
		len = maxlen;

	for (i = 0; i < len / 8; i++)
		p[i] = 0xff;
	if (len % 8)
		p[i] = (0xff00 >> (len % 8)) & 0xff;
}
20155009Sshin
2021541Srgrimes/*
2031541Srgrimes * Generic internet control operations (ioctl's).
2041541Srgrimes * Ifp is 0 if not an interface-specific ioctl.
2051541Srgrimes */
2061541Srgrimes/* ARGSUSED */
2071549Srgrimesint
208169454Srwatsonin_control(struct socket *so, u_long cmd, caddr_t data, struct ifnet *ifp,
209169454Srwatson    struct thread *td)
2101541Srgrimes{
211183550Szec	INIT_VNET_INET(curvnet); /* both so and ifp can be NULL here! */
2121541Srgrimes	register struct ifreq *ifr = (struct ifreq *)data;
213184295Sbz	register struct in_ifaddr *ia, *iap;
2141541Srgrimes	register struct ifaddr *ifa;
215168032Sbms	struct in_addr allhosts_addr;
21684102Sjlemon	struct in_addr dst;
2171541Srgrimes	struct in_ifaddr *oia;
2181541Srgrimes	struct in_aliasreq *ifra = (struct in_aliasreq *)data;
2191541Srgrimes	struct sockaddr_in oldaddr;
22087124Sbrian	int error, hostIsNew, iaIsNew, maskIsNew, s;
221168032Sbms	int iaIsFirst;
2221541Srgrimes
223184295Sbz	ia = NULL;
224168032Sbms	iaIsFirst = 0;
22587124Sbrian	iaIsNew = 0;
226168032Sbms	allhosts_addr.s_addr = htonl(INADDR_ALLHOSTS_GROUP);
22787124Sbrian
22855009Sshin	switch (cmd) {
22955009Sshin	case SIOCALIFADDR:
230164033Srwatson		if (td != NULL) {
231164033Srwatson			error = priv_check(td, PRIV_NET_ADDIFADDR);
232164033Srwatson			if (error)
233164033Srwatson				return (error);
234164033Srwatson		}
235184295Sbz		if (ifp == NULL)
236184295Sbz			return (EINVAL);
237164033Srwatson		return in_lifaddr_ioctl(so, cmd, data, ifp, td);
238164033Srwatson
23955009Sshin	case SIOCDLIFADDR:
240164033Srwatson		if (td != NULL) {
241164033Srwatson			error = priv_check(td, PRIV_NET_DELIFADDR);
242164033Srwatson			if (error)
243164033Srwatson				return (error);
244164033Srwatson		}
245184295Sbz		if (ifp == NULL)
246184295Sbz			return (EINVAL);
247164033Srwatson		return in_lifaddr_ioctl(so, cmd, data, ifp, td);
248164033Srwatson
24955009Sshin	case SIOCGLIFADDR:
250184295Sbz		if (ifp == NULL)
251184295Sbz			return (EINVAL);
25283366Sjulian		return in_lifaddr_ioctl(so, cmd, data, ifp, td);
25355009Sshin	}
25455009Sshin
2551541Srgrimes	/*
2561541Srgrimes	 * Find address for this interface, if it exists.
25714632Sfenner	 *
25814632Sfenner	 * If an alias address was specified, find that one instead of
25984102Sjlemon	 * the first one on the interface, if possible.
2601541Srgrimes	 */
261184295Sbz	if (ifp != NULL) {
26284102Sjlemon		dst = ((struct sockaddr_in *)&ifr->ifr_addr)->sin_addr;
26384102Sjlemon		LIST_FOREACH(iap, INADDR_HASH(dst.s_addr), ia_hash)
26484102Sjlemon			if (iap->ia_ifp == ifp &&
26584102Sjlemon			    iap->ia_addr.sin_addr.s_addr == dst.s_addr) {
266186948Sbz				if (td == NULL || prison_check_ip4(
267188144Sjamie				    td->td_ucred, &dst) == 0)
268186948Sbz					ia = iap;
26984102Sjlemon				break;
27084102Sjlemon			}
27184102Sjlemon		if (ia == NULL)
27284102Sjlemon			TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
27384102Sjlemon				iap = ifatoia(ifa);
27484102Sjlemon				if (iap->ia_addr.sin_family == AF_INET) {
275186948Sbz					if (td != NULL &&
276188144Sjamie					    prison_check_ip4(td->td_ucred,
277188144Sjamie					    &iap->ia_addr.sin_addr) != 0)
278186948Sbz						continue;
27914632Sfenner					ia = iap;
28014632Sfenner					break;
28114632Sfenner				}
28214632Sfenner			}
283168032Sbms		if (ia == NULL)
284168032Sbms			iaIsFirst = 1;
28584102Sjlemon	}
2861541Srgrimes
2871541Srgrimes	switch (cmd) {
2881541Srgrimes
2891541Srgrimes	case SIOCAIFADDR:
2901541Srgrimes	case SIOCDIFADDR:
291184295Sbz		if (ifp == NULL)
29241575Seivind			return (EADDRNOTAVAIL);
2938071Swollman		if (ifra->ifra_addr.sin_family == AF_INET) {
29471999Sphk			for (oia = ia; ia; ia = TAILQ_NEXT(ia, ia_link)) {
2958071Swollman				if (ia->ia_ifp == ifp  &&
2968071Swollman				    ia->ia_addr.sin_addr.s_addr ==
2978071Swollman				    ifra->ifra_addr.sin_addr.s_addr)
2988071Swollman					break;
2998071Swollman			}
3008876Srgrimes			if ((ifp->if_flags & IFF_POINTOPOINT)
3018071Swollman			    && (cmd == SIOCAIFADDR)
3028071Swollman			    && (ifra->ifra_dstaddr.sin_addr.s_addr
3038071Swollman				== INADDR_ANY)) {
304184295Sbz				return (EDESTADDRREQ);
3058071Swollman			}
3061541Srgrimes		}
307184295Sbz		if (cmd == SIOCDIFADDR && ia == NULL)
3081541Srgrimes			return (EADDRNOTAVAIL);
3091541Srgrimes		/* FALLTHROUGH */
3101541Srgrimes	case SIOCSIFADDR:
3111541Srgrimes	case SIOCSIFNETMASK:
3121541Srgrimes	case SIOCSIFDSTADDR:
313164033Srwatson		if (td != NULL) {
314175626Sbz			error = priv_check(td, (cmd == SIOCDIFADDR) ?
315175626Sbz			    PRIV_NET_DELIFADDR : PRIV_NET_ADDIFADDR);
316164033Srwatson			if (error)
317164033Srwatson				return (error);
318164033Srwatson		}
3191541Srgrimes
320184295Sbz		if (ifp == NULL)
32141575Seivind			return (EADDRNOTAVAIL);
322184295Sbz		if (ia == NULL) {
32320407Swollman			ia = (struct in_ifaddr *)
324111119Simp				malloc(sizeof *ia, M_IFADDR, M_WAITOK | M_ZERO);
325184295Sbz			if (ia == NULL)
3261541Srgrimes				return (ENOBUFS);
32715092Sdg			/*
32815092Sdg			 * Protect from ipintr() traversing address list
32915092Sdg			 * while we're modifying it.
33015092Sdg			 */
33115092Sdg			s = splnet();
33220407Swollman			ifa = &ia->ia_ifa;
333108033Shsu			IFA_LOCK_INIT(ifa);
33420407Swollman			ifa->ifa_addr = (struct sockaddr *)&ia->ia_addr;
33520407Swollman			ifa->ifa_dstaddr = (struct sockaddr *)&ia->ia_dstaddr;
33620407Swollman			ifa->ifa_netmask = (struct sockaddr *)&ia->ia_sockmask;
337108033Shsu			ifa->ifa_refcnt = 1;
338108033Shsu			TAILQ_INSERT_TAIL(&ifp->if_addrhead, ifa, ifa_link);
339108033Shsu
3401541Srgrimes			ia->ia_sockmask.sin_len = 8;
34185740Sdes			ia->ia_sockmask.sin_family = AF_INET;
3421541Srgrimes			if (ifp->if_flags & IFF_BROADCAST) {
3431541Srgrimes				ia->ia_broadaddr.sin_len = sizeof(ia->ia_addr);
3441541Srgrimes				ia->ia_broadaddr.sin_family = AF_INET;
3451541Srgrimes			}
3461541Srgrimes			ia->ia_ifp = ifp;
347151824Sglebius
348181803Sbz			TAILQ_INSERT_TAIL(&V_in_ifaddrhead, ia, ia_link);
34915092Sdg			splx(s);
35087124Sbrian			iaIsNew = 1;
3511541Srgrimes		}
3521541Srgrimes		break;
3531541Srgrimes
3541541Srgrimes	case SIOCSIFBRDADDR:
355164033Srwatson		if (td != NULL) {
356164033Srwatson			error = priv_check(td, PRIV_NET_ADDIFADDR);
357164033Srwatson			if (error)
358164033Srwatson				return (error);
359164033Srwatson		}
3601541Srgrimes		/* FALLTHROUGH */
3611541Srgrimes
3621541Srgrimes	case SIOCGIFADDR:
3631541Srgrimes	case SIOCGIFNETMASK:
3641541Srgrimes	case SIOCGIFDSTADDR:
3651541Srgrimes	case SIOCGIFBRDADDR:
366184295Sbz		if (ia == NULL)
3671541Srgrimes			return (EADDRNOTAVAIL);
3681541Srgrimes		break;
3691541Srgrimes	}
3701541Srgrimes	switch (cmd) {
3711541Srgrimes
3721541Srgrimes	case SIOCGIFADDR:
3731541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_addr) = ia->ia_addr;
37487124Sbrian		return (0);
3751541Srgrimes
3761541Srgrimes	case SIOCGIFBRDADDR:
3771541Srgrimes		if ((ifp->if_flags & IFF_BROADCAST) == 0)
3781541Srgrimes			return (EINVAL);
3791541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_dstaddr) = ia->ia_broadaddr;
38087124Sbrian		return (0);
3811541Srgrimes
3821541Srgrimes	case SIOCGIFDSTADDR:
3831541Srgrimes		if ((ifp->if_flags & IFF_POINTOPOINT) == 0)
3841541Srgrimes			return (EINVAL);
3851541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_dstaddr) = ia->ia_dstaddr;
38687124Sbrian		return (0);
3871541Srgrimes
3881541Srgrimes	case SIOCGIFNETMASK:
3891541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_addr) = ia->ia_sockmask;
39087124Sbrian		return (0);
3911541Srgrimes
3921541Srgrimes	case SIOCSIFDSTADDR:
3931541Srgrimes		if ((ifp->if_flags & IFF_POINTOPOINT) == 0)
3941541Srgrimes			return (EINVAL);
3951541Srgrimes		oldaddr = ia->ia_dstaddr;
3961541Srgrimes		ia->ia_dstaddr = *(struct sockaddr_in *)&ifr->ifr_dstaddr;
397184295Sbz		if (ifp->if_ioctl != NULL) {
398146883Siedowse			IFF_LOCKGIANT(ifp);
399146883Siedowse			error = (*ifp->if_ioctl)(ifp, SIOCSIFDSTADDR,
400146883Siedowse			    (caddr_t)ia);
401146883Siedowse			IFF_UNLOCKGIANT(ifp);
402146883Siedowse			if (error) {
403146883Siedowse				ia->ia_dstaddr = oldaddr;
404146883Siedowse				return (error);
405146883Siedowse			}
4061541Srgrimes		}
4071541Srgrimes		if (ia->ia_flags & IFA_ROUTE) {
4081541Srgrimes			ia->ia_ifa.ifa_dstaddr = (struct sockaddr *)&oldaddr;
4091541Srgrimes			rtinit(&(ia->ia_ifa), (int)RTM_DELETE, RTF_HOST);
4101541Srgrimes			ia->ia_ifa.ifa_dstaddr =
4111541Srgrimes					(struct sockaddr *)&ia->ia_dstaddr;
4121541Srgrimes			rtinit(&(ia->ia_ifa), (int)RTM_ADD, RTF_HOST|RTF_UP);
4131541Srgrimes		}
41487124Sbrian		return (0);
4151541Srgrimes
4161541Srgrimes	case SIOCSIFBRDADDR:
4171541Srgrimes		if ((ifp->if_flags & IFF_BROADCAST) == 0)
4181541Srgrimes			return (EINVAL);
4191541Srgrimes		ia->ia_broadaddr = *(struct sockaddr_in *)&ifr->ifr_broadaddr;
42087124Sbrian		return (0);
4211541Srgrimes
4221541Srgrimes	case SIOCSIFADDR:
42387124Sbrian		error = in_ifinit(ifp, ia,
42487124Sbrian		    (struct sockaddr_in *) &ifr->ifr_addr, 1);
42587124Sbrian		if (error != 0 && iaIsNew)
42687124Sbrian			break;
427168032Sbms		if (error == 0) {
428168032Sbms			if (iaIsFirst && (ifp->if_flags & IFF_MULTICAST) != 0)
429168032Sbms				in_addmulti(&allhosts_addr, ifp);
430126264Smlaier			EVENTHANDLER_INVOKE(ifaddr_event, ifp);
431168032Sbms		}
43287124Sbrian		return (0);
4331541Srgrimes
4341541Srgrimes	case SIOCSIFNETMASK:
43585740Sdes		ia->ia_sockmask.sin_addr = ifra->ifra_addr.sin_addr;
43685740Sdes		ia->ia_subnetmask = ntohl(ia->ia_sockmask.sin_addr.s_addr);
43787124Sbrian		return (0);
4381541Srgrimes
4391541Srgrimes	case SIOCAIFADDR:
4401541Srgrimes		maskIsNew = 0;
4411541Srgrimes		hostIsNew = 1;
4421541Srgrimes		error = 0;
4431541Srgrimes		if (ia->ia_addr.sin_family == AF_INET) {
4441541Srgrimes			if (ifra->ifra_addr.sin_len == 0) {
4451541Srgrimes				ifra->ifra_addr = ia->ia_addr;
4461541Srgrimes				hostIsNew = 0;
4471541Srgrimes			} else if (ifra->ifra_addr.sin_addr.s_addr ==
4481541Srgrimes					       ia->ia_addr.sin_addr.s_addr)
4491541Srgrimes				hostIsNew = 0;
4501541Srgrimes		}
4511541Srgrimes		if (ifra->ifra_mask.sin_len) {
4521541Srgrimes			in_ifscrub(ifp, ia);
4531541Srgrimes			ia->ia_sockmask = ifra->ifra_mask;
45485740Sdes			ia->ia_sockmask.sin_family = AF_INET;
4551541Srgrimes			ia->ia_subnetmask =
4561541Srgrimes			     ntohl(ia->ia_sockmask.sin_addr.s_addr);
4571541Srgrimes			maskIsNew = 1;
4581541Srgrimes		}
4591541Srgrimes		if ((ifp->if_flags & IFF_POINTOPOINT) &&
4601541Srgrimes		    (ifra->ifra_dstaddr.sin_family == AF_INET)) {
4611541Srgrimes			in_ifscrub(ifp, ia);
4621541Srgrimes			ia->ia_dstaddr = ifra->ifra_dstaddr;
4631541Srgrimes			maskIsNew  = 1; /* We lie; but the effect's the same */
4641541Srgrimes		}
4651541Srgrimes		if (ifra->ifra_addr.sin_family == AF_INET &&
4661541Srgrimes		    (hostIsNew || maskIsNew))
4671541Srgrimes			error = in_ifinit(ifp, ia, &ifra->ifra_addr, 0);
46887124Sbrian		if (error != 0 && iaIsNew)
46987124Sbrian			break;
47087124Sbrian
4711541Srgrimes		if ((ifp->if_flags & IFF_BROADCAST) &&
4721541Srgrimes		    (ifra->ifra_broadaddr.sin_family == AF_INET))
4731541Srgrimes			ia->ia_broadaddr = ifra->ifra_broadaddr;
474168032Sbms		if (error == 0) {
475168032Sbms			if (iaIsFirst && (ifp->if_flags & IFF_MULTICAST) != 0)
476168032Sbms				in_addmulti(&allhosts_addr, ifp);
477126264Smlaier			EVENTHANDLER_INVOKE(ifaddr_event, ifp);
478168032Sbms		}
4791541Srgrimes		return (error);
4801541Srgrimes
4811541Srgrimes	case SIOCDIFADDR:
48274299Sru		/*
48374299Sru		 * in_ifscrub kills the interface route.
48474299Sru		 */
4851541Srgrimes		in_ifscrub(ifp, ia);
48615092Sdg		/*
48774299Sru		 * in_ifadown gets rid of all the rest of
48874299Sru		 * the routes.  This is not quite the right
48974299Sru		 * thing to do, but at least if we are running
49074299Sru		 * a routing process they will come back.
49174299Sru		 */
49276469Sru		in_ifadown(&ia->ia_ifa, 1);
493126264Smlaier		EVENTHANDLER_INVOKE(ifaddr_event, ifp);
49487124Sbrian		error = 0;
4951541Srgrimes		break;
4961541Srgrimes
4971541Srgrimes	default:
498184295Sbz		if (ifp == NULL || ifp->if_ioctl == NULL)
4991541Srgrimes			return (EOPNOTSUPP);
500146883Siedowse		IFF_LOCKGIANT(ifp);
501146883Siedowse		error = (*ifp->if_ioctl)(ifp, cmd, data);
502146883Siedowse		IFF_UNLOCKGIANT(ifp);
503146883Siedowse		return (error);
5041541Srgrimes	}
50587124Sbrian
50687124Sbrian	/*
50787124Sbrian	 * Protect from ipintr() traversing address list while we're modifying
50887124Sbrian	 * it.
50987124Sbrian	 */
51087124Sbrian	s = splnet();
51187124Sbrian	TAILQ_REMOVE(&ifp->if_addrhead, &ia->ia_ifa, ifa_link);
512181803Sbz	TAILQ_REMOVE(&V_in_ifaddrhead, ia, ia_link);
513168032Sbms	if (ia->ia_addr.sin_family == AF_INET) {
514154777Sandre		LIST_REMOVE(ia, ia_hash);
515168032Sbms		/*
516168032Sbms		 * If this is the last IPv4 address configured on this
517168032Sbms		 * interface, leave the all-hosts group.
518168032Sbms		 * XXX: This is quite ugly because of locking and structure.
519168032Sbms		 */
520168032Sbms		oia = NULL;
521168032Sbms		IFP_TO_IA(ifp, oia);
522168032Sbms		if (oia == NULL) {
523168032Sbms			struct in_multi *inm;
524168032Sbms
525168032Sbms			IFF_LOCKGIANT(ifp);
526168032Sbms			IN_MULTI_LOCK();
527168032Sbms			IN_LOOKUP_MULTI(allhosts_addr, ifp, inm);
528168032Sbms			if (inm != NULL)
529168032Sbms				in_delmulti_locked(inm);
530168032Sbms			IN_MULTI_UNLOCK();
531168032Sbms			IFF_UNLOCKGIANT(ifp);
532168032Sbms		}
533168032Sbms	}
53487124Sbrian	IFAFREE(&ia->ia_ifa);
53587124Sbrian	splx(s);
53687124Sbrian
53787124Sbrian	return (error);
5381541Srgrimes}
5391541Srgrimes
5401541Srgrimes/*
54155009Sshin * SIOC[GAD]LIFADDR.
54255009Sshin *	SIOCGLIFADDR: get first address. (?!?)
54355009Sshin *	SIOCGLIFADDR with IFLR_PREFIX:
54455009Sshin *		get first address that matches the specified prefix.
54555009Sshin *	SIOCALIFADDR: add the specified address.
54655009Sshin *	SIOCALIFADDR with IFLR_PREFIX:
54755009Sshin *		EINVAL since we can't deduce hostid part of the address.
54855009Sshin *	SIOCDLIFADDR: delete the specified address.
54955009Sshin *	SIOCDLIFADDR with IFLR_PREFIX:
55055009Sshin *		delete the first address that matches the specified prefix.
55155009Sshin * return values:
55255009Sshin *	EINVAL on invalid parameters
55355009Sshin *	EADDRNOTAVAIL on prefix match failed/specified address not found
55455009Sshin *	other values may be returned from in_ioctl()
55555009Sshin */
55655009Sshinstatic int
557169454Srwatsonin_lifaddr_ioctl(struct socket *so, u_long cmd, caddr_t data,
558169454Srwatson    struct ifnet *ifp, struct thread *td)
55955009Sshin{
56055009Sshin	struct if_laddrreq *iflr = (struct if_laddrreq *)data;
56155009Sshin	struct ifaddr *ifa;
56255009Sshin
56355009Sshin	/* sanity checks */
564184295Sbz	if (data == NULL || ifp == NULL) {
56555009Sshin		panic("invalid argument to in_lifaddr_ioctl");
56655009Sshin		/*NOTRECHED*/
56755009Sshin	}
56855009Sshin
56955009Sshin	switch (cmd) {
57055009Sshin	case SIOCGLIFADDR:
57155009Sshin		/* address must be specified on GET with IFLR_PREFIX */
57255009Sshin		if ((iflr->flags & IFLR_PREFIX) == 0)
57355009Sshin			break;
57455009Sshin		/*FALLTHROUGH*/
57555009Sshin	case SIOCALIFADDR:
57655009Sshin	case SIOCDLIFADDR:
57755009Sshin		/* address must be specified on ADD and DELETE */
57855917Sshin		if (iflr->addr.ss_family != AF_INET)
579184295Sbz			return (EINVAL);
58055917Sshin		if (iflr->addr.ss_len != sizeof(struct sockaddr_in))
581184295Sbz			return (EINVAL);
58255009Sshin		/* XXX need improvement */
58355917Sshin		if (iflr->dstaddr.ss_family
58455917Sshin		 && iflr->dstaddr.ss_family != AF_INET)
585184295Sbz			return (EINVAL);
58655917Sshin		if (iflr->dstaddr.ss_family
58755917Sshin		 && iflr->dstaddr.ss_len != sizeof(struct sockaddr_in))
588184295Sbz			return (EINVAL);
58955009Sshin		break;
59055009Sshin	default: /*shouldn't happen*/
591184295Sbz		return (EOPNOTSUPP);
59255009Sshin	}
59355009Sshin	if (sizeof(struct in_addr) * 8 < iflr->prefixlen)
594184295Sbz		return (EINVAL);
59555009Sshin
59655009Sshin	switch (cmd) {
59755009Sshin	case SIOCALIFADDR:
59855009Sshin	    {
59955009Sshin		struct in_aliasreq ifra;
60055009Sshin
60155009Sshin		if (iflr->flags & IFLR_PREFIX)
602184295Sbz			return (EINVAL);
60355009Sshin
60455009Sshin		/* copy args to in_aliasreq, perform ioctl(SIOCAIFADDR_IN6). */
60555009Sshin		bzero(&ifra, sizeof(ifra));
60655009Sshin		bcopy(iflr->iflr_name, ifra.ifra_name,
60755009Sshin			sizeof(ifra.ifra_name));
60855009Sshin
60955917Sshin		bcopy(&iflr->addr, &ifra.ifra_addr, iflr->addr.ss_len);
61055009Sshin
61155917Sshin		if (iflr->dstaddr.ss_family) {	/*XXX*/
61255009Sshin			bcopy(&iflr->dstaddr, &ifra.ifra_dstaddr,
61355917Sshin				iflr->dstaddr.ss_len);
61455009Sshin		}
61555009Sshin
61655009Sshin		ifra.ifra_mask.sin_family = AF_INET;
61755009Sshin		ifra.ifra_mask.sin_len = sizeof(struct sockaddr_in);
61855009Sshin		in_len2mask(&ifra.ifra_mask.sin_addr, iflr->prefixlen);
61955009Sshin
620184295Sbz		return (in_control(so, SIOCAIFADDR, (caddr_t)&ifra, ifp, td));
62155009Sshin	    }
62255009Sshin	case SIOCGLIFADDR:
62355009Sshin	case SIOCDLIFADDR:
62455009Sshin	    {
62555009Sshin		struct in_ifaddr *ia;
62655009Sshin		struct in_addr mask, candidate, match;
62755009Sshin		struct sockaddr_in *sin;
62855009Sshin
62955009Sshin		bzero(&mask, sizeof(mask));
630170855Smjacob		bzero(&match, sizeof(match));
63155009Sshin		if (iflr->flags & IFLR_PREFIX) {
63255009Sshin			/* lookup a prefix rather than address. */
63355009Sshin			in_len2mask(&mask, iflr->prefixlen);
63455009Sshin
63555009Sshin			sin = (struct sockaddr_in *)&iflr->addr;
63655009Sshin			match.s_addr = sin->sin_addr.s_addr;
63755009Sshin			match.s_addr &= mask.s_addr;
63855009Sshin
63955009Sshin			/* if you set extra bits, that's wrong */
64055009Sshin			if (match.s_addr != sin->sin_addr.s_addr)
641184295Sbz				return (EINVAL);
64255009Sshin
64355009Sshin		} else {
644170855Smjacob			/* on getting an address, take the 1st match */
645170855Smjacob			/* on deleting an address, do exact match */
646170855Smjacob			if (cmd != SIOCGLIFADDR) {
64755009Sshin				in_len2mask(&mask, 32);
64855009Sshin				sin = (struct sockaddr_in *)&iflr->addr;
64955009Sshin				match.s_addr = sin->sin_addr.s_addr;
65055009Sshin			}
65155009Sshin		}
65255009Sshin
65355009Sshin		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link)	{
65455009Sshin			if (ifa->ifa_addr->sa_family != AF_INET6)
65555009Sshin				continue;
656170855Smjacob			if (match.s_addr == 0)
65755009Sshin				break;
65855009Sshin			candidate.s_addr = ((struct sockaddr_in *)&ifa->ifa_addr)->sin_addr.s_addr;
65955009Sshin			candidate.s_addr &= mask.s_addr;
66055009Sshin			if (candidate.s_addr == match.s_addr)
66155009Sshin				break;
66255009Sshin		}
663184295Sbz		if (ifa == NULL)
664184295Sbz			return (EADDRNOTAVAIL);
66555009Sshin		ia = (struct in_ifaddr *)ifa;
66655009Sshin
66755009Sshin		if (cmd == SIOCGLIFADDR) {
66855009Sshin			/* fill in the if_laddrreq structure */
66955009Sshin			bcopy(&ia->ia_addr, &iflr->addr, ia->ia_addr.sin_len);
67055009Sshin
67155009Sshin			if ((ifp->if_flags & IFF_POINTOPOINT) != 0) {
67255009Sshin				bcopy(&ia->ia_dstaddr, &iflr->dstaddr,
67355009Sshin					ia->ia_dstaddr.sin_len);
67455009Sshin			} else
67555009Sshin				bzero(&iflr->dstaddr, sizeof(iflr->dstaddr));
67655009Sshin
67755009Sshin			iflr->prefixlen =
67855009Sshin				in_mask2len(&ia->ia_sockmask.sin_addr);
67955009Sshin
68055009Sshin			iflr->flags = 0;	/*XXX*/
68155009Sshin
682184295Sbz			return (0);
68355009Sshin		} else {
68455009Sshin			struct in_aliasreq ifra;
68555009Sshin
68655009Sshin			/* fill in_aliasreq and do ioctl(SIOCDIFADDR_IN6) */
68755009Sshin			bzero(&ifra, sizeof(ifra));
68855009Sshin			bcopy(iflr->iflr_name, ifra.ifra_name,
68955009Sshin				sizeof(ifra.ifra_name));
69055009Sshin
69155009Sshin			bcopy(&ia->ia_addr, &ifra.ifra_addr,
69255009Sshin				ia->ia_addr.sin_len);
69355009Sshin			if ((ifp->if_flags & IFF_POINTOPOINT) != 0) {
69455009Sshin				bcopy(&ia->ia_dstaddr, &ifra.ifra_dstaddr,
69555009Sshin					ia->ia_dstaddr.sin_len);
69655009Sshin			}
69755009Sshin			bcopy(&ia->ia_sockmask, &ifra.ifra_dstaddr,
69855009Sshin				ia->ia_sockmask.sin_len);
69955009Sshin
700184295Sbz			return (in_control(so, SIOCDIFADDR, (caddr_t)&ifra,
701184295Sbz			    ifp, td));
70255009Sshin		}
70355009Sshin	    }
70455009Sshin	}
70555009Sshin
706184295Sbz	return (EOPNOTSUPP);	/*just for safety*/
70755009Sshin}
70855009Sshin
/*
 * Delete any existing route for an interface address.
 *
 * ifp is not used; the work is delegated to in_scrubprefix(), whose return
 * value is discarded.
 */
void
in_ifscrub(struct ifnet *ifp, struct in_ifaddr *ia)
{

	(void)in_scrubprefix(ia);
}
7181541Srgrimes
7191541Srgrimes/*
7201541Srgrimes * Initialize an interface's internet address
7211541Srgrimes * and routing table entry.
7221541Srgrimes */
72312296Sphkstatic int
724169454Srwatsonin_ifinit(struct ifnet *ifp, struct in_ifaddr *ia, struct sockaddr_in *sin,
725169454Srwatson    int scrub)
7261541Srgrimes{
727183550Szec	INIT_VNET_INET(ifp->if_vnet);
7281541Srgrimes	register u_long i = ntohl(sin->sin_addr.s_addr);
7291541Srgrimes	struct sockaddr_in oldaddr;
73094326Sbrian	int s = splimp(), flags = RTF_UP, error = 0;
7311541Srgrimes
7321541Srgrimes	oldaddr = ia->ia_addr;
733105748Ssuz	if (oldaddr.sin_family == AF_INET)
734105748Ssuz		LIST_REMOVE(ia, ia_hash);
7351541Srgrimes	ia->ia_addr = *sin;
736105748Ssuz	if (ia->ia_addr.sin_family == AF_INET)
737105748Ssuz		LIST_INSERT_HEAD(INADDR_HASH(ia->ia_addr.sin_addr.s_addr),
738105748Ssuz		    ia, ia_hash);
7391541Srgrimes	/*
7401541Srgrimes	 * Give the interface a chance to initialize
7411541Srgrimes	 * if this is its first address,
7421541Srgrimes	 * and to validate the address if necessary.
7431541Srgrimes	 */
744184295Sbz	if (ifp->if_ioctl != NULL) {
745146883Siedowse		IFF_LOCKGIANT(ifp);
746146883Siedowse		error = (*ifp->if_ioctl)(ifp, SIOCSIFADDR, (caddr_t)ia);
747146883Siedowse		IFF_UNLOCKGIANT(ifp);
748146883Siedowse		if (error) {
749146883Siedowse			splx(s);
750146883Siedowse			/* LIST_REMOVE(ia, ia_hash) is done in in_control */
751146883Siedowse			ia->ia_addr = oldaddr;
752146883Siedowse			if (ia->ia_addr.sin_family == AF_INET)
753146883Siedowse				LIST_INSERT_HEAD(INADDR_HASH(
754146883Siedowse				    ia->ia_addr.sin_addr.s_addr), ia, ia_hash);
755179971Sgonzo			else
756179971Sgonzo				/*
757179971Sgonzo				 * If oldaddr family is not AF_INET (e.g.
758179971Sgonzo				 * interface has been just created) in_control
759179971Sgonzo				 * does not call LIST_REMOVE, and we end up
760179971Sgonzo				 * with bogus ia entries in hash
761179971Sgonzo				 */
762179971Sgonzo				LIST_REMOVE(ia, ia_hash);
763146883Siedowse			return (error);
764146883Siedowse		}
7651541Srgrimes	}
7661541Srgrimes	splx(s);
7671541Srgrimes	if (scrub) {
7681541Srgrimes		ia->ia_ifa.ifa_addr = (struct sockaddr *)&oldaddr;
7691541Srgrimes		in_ifscrub(ifp, ia);
7701541Srgrimes		ia->ia_ifa.ifa_addr = (struct sockaddr *)&ia->ia_addr;
7711541Srgrimes	}
7721541Srgrimes	if (IN_CLASSA(i))
7731541Srgrimes		ia->ia_netmask = IN_CLASSA_NET;
7741541Srgrimes	else if (IN_CLASSB(i))
7751541Srgrimes		ia->ia_netmask = IN_CLASSB_NET;
7761541Srgrimes	else
7771541Srgrimes		ia->ia_netmask = IN_CLASSC_NET;
7781541Srgrimes	/*
7791541Srgrimes	 * The subnet mask usually includes at least the standard network part,
7801541Srgrimes	 * but may may be smaller in the case of supernetting.
7811541Srgrimes	 * If it is set, we believe it.
7821541Srgrimes	 */
7831541Srgrimes	if (ia->ia_subnetmask == 0) {
7841541Srgrimes		ia->ia_subnetmask = ia->ia_netmask;
7851541Srgrimes		ia->ia_sockmask.sin_addr.s_addr = htonl(ia->ia_subnetmask);
7861541Srgrimes	} else
7871541Srgrimes		ia->ia_netmask &= ia->ia_subnetmask;
7881541Srgrimes	ia->ia_net = i & ia->ia_netmask;
7891541Srgrimes	ia->ia_subnet = i & ia->ia_subnetmask;
7901541Srgrimes	in_socktrim(&ia->ia_sockmask);
791143868Sglebius#ifdef DEV_CARP
7921541Srgrimes	/*
793143868Sglebius	 * XXX: carp(4) does not have interface route
794143868Sglebius	 */
795143868Sglebius	if (ifp->if_type == IFT_CARP)
796143868Sglebius		return (0);
797143868Sglebius#endif
798143868Sglebius	/*
7991541Srgrimes	 * Add route for the network.
8001541Srgrimes	 */
8011541Srgrimes	ia->ia_ifa.ifa_metric = ifp->if_metric;
8021541Srgrimes	if (ifp->if_flags & IFF_BROADCAST) {
8031541Srgrimes		ia->ia_broadaddr.sin_addr.s_addr =
8041541Srgrimes			htonl(ia->ia_subnet | ~ia->ia_subnetmask);
8051541Srgrimes		ia->ia_netbroadcast.s_addr =
8061541Srgrimes			htonl(ia->ia_net | ~ ia->ia_netmask);
8071541Srgrimes	} else if (ifp->if_flags & IFF_LOOPBACK) {
808137833Smlaier		ia->ia_dstaddr = ia->ia_addr;
8091541Srgrimes		flags |= RTF_HOST;
8101541Srgrimes	} else if (ifp->if_flags & IFF_POINTOPOINT) {
8111541Srgrimes		if (ia->ia_dstaddr.sin_family != AF_INET)
8121541Srgrimes			return (0);
8131541Srgrimes		flags |= RTF_HOST;
8141541Srgrimes	}
815137628Smlaier	if ((error = in_addprefix(ia, flags)) != 0)
816137628Smlaier		return (error);
81794326Sbrian
8181541Srgrimes	return (error);
8191541Srgrimes}
8201541Srgrimes
/*
 * Route flags implied by the interface that address (x) is configured on:
 * RTF_HOST when the interface is loopback or point-to-point, 0 otherwise.
 */
#define rtinitflags(x)							\
	(((x)->ia_ifp->if_flags & (IFF_LOOPBACK | IFF_POINTOPOINT))	\
	    ? RTF_HOST : 0)
824137628Smlaier/*
825170855Smjacob * Check if we have a route for the given prefix already or add one accordingly.
826137628Smlaier */
827137628Smlaierstatic int
828169454Srwatsonin_addprefix(struct in_ifaddr *target, int flags)
829137628Smlaier{
830183550Szec	INIT_VNET_INET(curvnet);
831137628Smlaier	struct in_ifaddr *ia;
832151555Sglebius	struct in_addr prefix, mask, p, m;
833137628Smlaier	int error;
8341541Srgrimes
835170855Smjacob	if ((flags & RTF_HOST) != 0) {
836137628Smlaier		prefix = target->ia_dstaddr.sin_addr;
837170855Smjacob		mask.s_addr = 0;
838170855Smjacob	} else {
839137628Smlaier		prefix = target->ia_addr.sin_addr;
840137628Smlaier		mask = target->ia_sockmask.sin_addr;
841137628Smlaier		prefix.s_addr &= mask.s_addr;
842137628Smlaier	}
843137628Smlaier
844181803Sbz	TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link) {
845151555Sglebius		if (rtinitflags(ia)) {
846137628Smlaier			p = ia->ia_addr.sin_addr;
847151555Sglebius
848151555Sglebius			if (prefix.s_addr != p.s_addr)
849151555Sglebius				continue;
850151555Sglebius		} else {
851151555Sglebius			p = ia->ia_addr.sin_addr;
852151555Sglebius			m = ia->ia_sockmask.sin_addr;
853151555Sglebius			p.s_addr &= m.s_addr;
854151555Sglebius
855151555Sglebius			if (prefix.s_addr != p.s_addr ||
856151555Sglebius			    mask.s_addr != m.s_addr)
857151555Sglebius				continue;
858137628Smlaier		}
859137628Smlaier
860137628Smlaier		/*
861137628Smlaier		 * If we got a matching prefix route inserted by other
862137628Smlaier		 * interface address, we are done here.
863137628Smlaier		 */
864149221Sglebius		if (ia->ia_flags & IFA_ROUTE) {
865181803Sbz			if (V_sameprefixcarponly &&
866149221Sglebius			    target->ia_ifp->if_type != IFT_CARP &&
867149221Sglebius			    ia->ia_ifp->if_type != IFT_CARP)
868149221Sglebius				return (EEXIST);
869149221Sglebius			else
870149221Sglebius				return (0);
871149221Sglebius		}
872137628Smlaier	}
873137628Smlaier
874137628Smlaier	/*
875137628Smlaier	 * No-one seem to have this prefix route, so we try to insert it.
876137628Smlaier	 */
877137628Smlaier	error = rtinit(&target->ia_ifa, (int)RTM_ADD, flags);
878137628Smlaier	if (!error)
879137628Smlaier		target->ia_flags |= IFA_ROUTE;
880184295Sbz	return (error);
881137628Smlaier}
882137628Smlaier
883186119Sqingliextern void arp_ifscrub(struct ifnet *ifp, uint32_t addr);
884186119Sqingli
8851541Srgrimes/*
886137628Smlaier * If there is no other address in the system that can serve a route to the
887137628Smlaier * same prefix, remove the route.  Hand over the route to the new address
888137628Smlaier * otherwise.
889137628Smlaier */
890137628Smlaierstatic int
891169454Srwatsonin_scrubprefix(struct in_ifaddr *target)
892137628Smlaier{
893183550Szec	INIT_VNET_INET(curvnet);
894137628Smlaier	struct in_ifaddr *ia;
895137628Smlaier	struct in_addr prefix, mask, p;
896137628Smlaier	int error;
897137628Smlaier
898137628Smlaier	if ((target->ia_flags & IFA_ROUTE) == 0)
899184295Sbz		return (0);
900137628Smlaier
901137628Smlaier	if (rtinitflags(target))
902137628Smlaier		prefix = target->ia_dstaddr.sin_addr;
903137628Smlaier	else {
904137628Smlaier		prefix = target->ia_addr.sin_addr;
905137628Smlaier		mask = target->ia_sockmask.sin_addr;
906137628Smlaier		prefix.s_addr &= mask.s_addr;
907186119Sqingli		/* remove arp cache */
908186119Sqingli		arp_ifscrub(target->ia_ifp, IA_SIN(target)->sin_addr.s_addr);
909137628Smlaier	}
910137628Smlaier
911181803Sbz	TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link) {
912137628Smlaier		if (rtinitflags(ia))
913137628Smlaier			p = ia->ia_dstaddr.sin_addr;
914137628Smlaier		else {
915137628Smlaier			p = ia->ia_addr.sin_addr;
916137628Smlaier			p.s_addr &= ia->ia_sockmask.sin_addr.s_addr;
917137628Smlaier		}
918137628Smlaier
919137628Smlaier		if (prefix.s_addr != p.s_addr)
920137628Smlaier			continue;
921137628Smlaier
922137628Smlaier		/*
923137628Smlaier		 * If we got a matching prefix address, move IFA_ROUTE and
924137628Smlaier		 * the route itself to it.  Make sure that routing daemons
925137628Smlaier		 * get a heads-up.
926143868Sglebius		 *
927143868Sglebius		 * XXX: a special case for carp(4) interface
928137628Smlaier		 */
929143868Sglebius		if ((ia->ia_flags & IFA_ROUTE) == 0
930143868Sglebius#ifdef DEV_CARP
931143868Sglebius		    && (ia->ia_ifp->if_type != IFT_CARP)
932143868Sglebius#endif
933143868Sglebius							) {
934137628Smlaier			rtinit(&(target->ia_ifa), (int)RTM_DELETE,
935137628Smlaier			    rtinitflags(target));
936137628Smlaier			target->ia_flags &= ~IFA_ROUTE;
937137628Smlaier
938137628Smlaier			error = rtinit(&ia->ia_ifa, (int)RTM_ADD,
939137628Smlaier			    rtinitflags(ia) | RTF_UP);
940137628Smlaier			if (error == 0)
941137628Smlaier				ia->ia_flags |= IFA_ROUTE;
942184295Sbz			return (error);
943137628Smlaier		}
944137628Smlaier	}
945137628Smlaier
946137628Smlaier	/*
947137628Smlaier	 * As no-one seem to have this prefix, we can remove the route.
948137628Smlaier	 */
949137628Smlaier	rtinit(&(target->ia_ifa), (int)RTM_DELETE, rtinitflags(target));
950137628Smlaier	target->ia_flags &= ~IFA_ROUTE;
951184295Sbz	return (0);
952137628Smlaier}
953137628Smlaier
954137628Smlaier#undef rtinitflags
955137628Smlaier
956137628Smlaier/*
9571541Srgrimes * Return 1 if the address might be a local broadcast address.
9581541Srgrimes */
9591549Srgrimesint
960169454Srwatsonin_broadcast(struct in_addr in, struct ifnet *ifp)
9611541Srgrimes{
9621541Srgrimes	register struct ifaddr *ifa;
9631541Srgrimes	u_long t;
9641541Srgrimes
9651541Srgrimes	if (in.s_addr == INADDR_BROADCAST ||
9661541Srgrimes	    in.s_addr == INADDR_ANY)
967184295Sbz		return (1);
9681541Srgrimes	if ((ifp->if_flags & IFF_BROADCAST) == 0)
969184295Sbz		return (0);
9701541Srgrimes	t = ntohl(in.s_addr);
9711541Srgrimes	/*
9721541Srgrimes	 * Look through the list of addresses for a match
9731541Srgrimes	 * with a broadcast address.
9741541Srgrimes	 */
9751541Srgrimes#define ia ((struct in_ifaddr *)ifa)
97674362Sphk	TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link)
9771541Srgrimes		if (ifa->ifa_addr->sa_family == AF_INET &&
9781541Srgrimes		    (in.s_addr == ia->ia_broadaddr.sin_addr.s_addr ||
9791541Srgrimes		     in.s_addr == ia->ia_netbroadcast.s_addr ||
9801541Srgrimes		     /*
9811541Srgrimes		      * Check for old-style (host 0) broadcast.
9821541Srgrimes		      */
98313351Sguido		     t == ia->ia_subnet || t == ia->ia_net) &&
98413351Sguido		     /*
98513351Sguido		      * Check for an all one subnetmask. These
98613351Sguido		      * only exist when an interface gets a secondary
98713351Sguido		      * address.
98813351Sguido		      */
98913351Sguido		     ia->ia_subnetmask != (u_long)0xffffffff)
990184295Sbz			    return (1);
9911541Srgrimes	return (0);
9921541Srgrimes#undef ia
9931541Srgrimes}
994167729Sbms
9951541Srgrimes/*
996167729Sbms * Delete all IPv4 multicast address records, and associated link-layer
997167729Sbms * multicast address records, associated with ifp.
998162718Sbms */
999167729Sbmsstatic void
1000167729Sbmsin_purgemaddrs(struct ifnet *ifp)
1001162718Sbms{
1002183550Szec	INIT_VNET_INET(ifp->if_vnet);
1003162718Sbms	struct in_multi *inm;
1004162718Sbms	struct in_multi *oinm;
1005162718Sbms
1006162718Sbms	IFF_LOCKGIANT(ifp);
1007162718Sbms	IN_MULTI_LOCK();
1008181803Sbz	LIST_FOREACH_SAFE(inm, &V_in_multihead, inm_link, oinm) {
1009162718Sbms		if (inm->inm_ifp == ifp)
1010162718Sbms			in_delmulti_locked(inm);
1011162718Sbms	}
1012150853Srwatson	IN_MULTI_UNLOCK();
1013150852Srwatson	IFF_UNLOCKGIANT(ifp);
10141541Srgrimes}
1015150296Srwatson
1016150296Srwatson/*
1017150296Srwatson * On interface removal, clean up IPv4 data structures hung off of the ifnet.
1018150296Srwatson */
1019150296Srwatsonvoid
1020169454Srwatsonin_ifdetach(struct ifnet *ifp)
1021150296Srwatson{
1022183550Szec	INIT_VNET_INET(ifp->if_vnet);
1023150296Srwatson
1024181803Sbz	in_pcbpurgeif0(&V_ripcbinfo, ifp);
1025181803Sbz	in_pcbpurgeif0(&V_udbinfo, ifp);
1026167729Sbms	in_purgemaddrs(ifp);
1027150296Srwatson}
1028186119Sqingli
1029186119Sqingli#include <sys/syslog.h>
1030186119Sqingli#include <net/if_dl.h>
1031186119Sqingli#include <netinet/if_ether.h>
1032186119Sqingli
1033186119Sqinglistruct in_llentry {
1034186119Sqingli	struct llentry		base;
1035186119Sqingli	struct sockaddr_in	l3_addr4;
1036186119Sqingli};
1037186119Sqingli
1038186119Sqinglistatic struct llentry *
1039186119Sqingliin_lltable_new(const struct sockaddr *l3addr, u_int flags)
1040186119Sqingli{
1041186119Sqingli	struct in_llentry *lle;
1042186119Sqingli
1043186119Sqingli	lle = malloc(sizeof(struct in_llentry), M_LLTABLE, M_DONTWAIT | M_ZERO);
1044186119Sqingli	if (lle == NULL)		/* NB: caller generates msg */
1045186119Sqingli		return NULL;
1046186119Sqingli
1047186119Sqingli	callout_init(&lle->base.la_timer, CALLOUT_MPSAFE);
1048186119Sqingli	/*
1049186119Sqingli	 * For IPv4 this will trigger "arpresolve" to generate
1050186119Sqingli	 * an ARP request.
1051186119Sqingli	 */
1052186119Sqingli	lle->base.la_expire = time_second; /* mark expired */
1053186119Sqingli	lle->l3_addr4 = *(const struct sockaddr_in *)l3addr;
1054186119Sqingli	lle->base.lle_refcnt = 1;
1055186119Sqingli	LLE_LOCK_INIT(&lle->base);
1056186119Sqingli	return &lle->base;
1057186119Sqingli}
1058186119Sqingli
1059186119Sqingli/*
1060186119Sqingli * Deletes an address from the address table.
1061186119Sqingli * This function is called by the timer functions
1062186119Sqingli * such as arptimer() and nd6_llinfo_timer(), and
1063186119Sqingli * the caller does the locking.
1064186119Sqingli */
1065186119Sqinglistatic void
1066186119Sqingliin_lltable_free(struct lltable *llt, struct llentry *lle)
1067186119Sqingli{
1068186150Skmacy	LLE_WUNLOCK(lle);
1069186150Skmacy	LLE_LOCK_DESTROY(lle);
1070186119Sqingli	free(lle, M_LLTABLE);
1071186119Sqingli}
1072186119Sqingli
1073186119Sqinglistatic int
1074186119Sqingliin_lltable_rtcheck(struct ifnet *ifp, const struct sockaddr *l3addr)
1075186119Sqingli{
1076186119Sqingli	struct rtentry *rt;
1077186119Sqingli
1078186119Sqingli	KASSERT(l3addr->sa_family == AF_INET,
1079186119Sqingli	    ("sin_family %d", l3addr->sa_family));
1080186119Sqingli
1081186119Sqingli	/* XXX rtalloc1 should take a const param */
1082186119Sqingli	rt = rtalloc1(__DECONST(struct sockaddr *, l3addr), 0, 0);
1083186119Sqingli	if (rt == NULL || (rt->rt_flags & RTF_GATEWAY) || rt->rt_ifp != ifp) {
1084186119Sqingli		log(LOG_INFO, "IPv4 address: \"%s\" is not on the network\n",
1085186119Sqingli		    inet_ntoa(((const struct sockaddr_in *)l3addr)->sin_addr));
1086186119Sqingli		if (rt != NULL)
1087186119Sqingli			RTFREE_LOCKED(rt);
1088186119Sqingli		return (EINVAL);
1089186119Sqingli	}
1090186119Sqingli	RTFREE_LOCKED(rt);
1091186119Sqingli	return 0;
1092186119Sqingli}
1093186119Sqingli
1094186119Sqingli/*
1095186119Sqingli * Return NULL if not found or marked for deletion.
1096186119Sqingli * If found return lle read locked.
1097186119Sqingli */
1098186119Sqinglistatic struct llentry *
1099186119Sqingliin_lltable_lookup(struct lltable *llt, u_int flags, const struct sockaddr *l3addr)
1100186119Sqingli{
1101186119Sqingli	const struct sockaddr_in *sin = (const struct sockaddr_in *)l3addr;
1102186119Sqingli	struct ifnet *ifp = llt->llt_ifp;
1103186119Sqingli	struct llentry *lle;
1104186119Sqingli	struct llentries *lleh;
1105186119Sqingli	u_int hashkey;
1106186119Sqingli
1107186119Sqingli	IF_AFDATA_LOCK_ASSERT(ifp);
1108186119Sqingli	KASSERT(l3addr->sa_family == AF_INET,
1109186119Sqingli	    ("sin_family %d", l3addr->sa_family));
1110186119Sqingli
1111186119Sqingli	hashkey = sin->sin_addr.s_addr;
1112186119Sqingli	lleh = &llt->lle_head[LLATBL_HASH(hashkey, LLTBL_HASHMASK)];
1113186119Sqingli	LIST_FOREACH(lle, lleh, lle_next) {
1114186708Sqingli		struct sockaddr_in *sa2 = (struct sockaddr_in *)L3_ADDR(lle);
1115186119Sqingli		if (lle->la_flags & LLE_DELETED)
1116186119Sqingli			continue;
1117186708Sqingli		if (sa2->sin_addr.s_addr == sin->sin_addr.s_addr)
1118186119Sqingli			break;
1119186119Sqingli	}
1120186119Sqingli	if (lle == NULL) {
1121186119Sqingli#ifdef DIAGNOSTICS
1122186119Sqingli		if (flags & LLE_DELETE)
1123186119Sqingli			log(LOG_INFO, "interface address is missing from cache = %p  in delete\n", lle);
1124186119Sqingli#endif
1125186119Sqingli		if (!(flags & LLE_CREATE))
1126186119Sqingli			return (NULL);
1127186119Sqingli		/*
1128186119Sqingli		 * A route that covers the given address must have
1129186119Sqingli		 * been installed 1st because we are doing a resolution,
1130186119Sqingli		 * verify this.
1131186119Sqingli		 */
1132186119Sqingli		if (!(flags & LLE_IFADDR) &&
1133186119Sqingli		    in_lltable_rtcheck(ifp, l3addr) != 0)
1134186119Sqingli			goto done;
1135186119Sqingli
1136186119Sqingli		lle = in_lltable_new(l3addr, flags);
1137186119Sqingli		if (lle == NULL) {
1138186119Sqingli			log(LOG_INFO, "lla_lookup: new lle malloc failed\n");
1139186119Sqingli			goto done;
1140186119Sqingli		}
1141186119Sqingli		lle->la_flags = flags & ~LLE_CREATE;
1142186119Sqingli		if ((flags & (LLE_CREATE | LLE_IFADDR)) == (LLE_CREATE | LLE_IFADDR)) {
1143186119Sqingli			bcopy(IF_LLADDR(ifp), &lle->ll_addr, ifp->if_addrlen);
1144186119Sqingli			lle->la_flags |= (LLE_VALID | LLE_STATIC);
1145186119Sqingli		}
1146186119Sqingli
1147186119Sqingli		lle->lle_tbl  = llt;
1148186119Sqingli		lle->lle_head = lleh;
1149186119Sqingli		LIST_INSERT_HEAD(lleh, lle, lle_next);
1150186119Sqingli	} else if (flags & LLE_DELETE) {
1151186119Sqingli		if (!(lle->la_flags & LLE_IFADDR) || (flags & LLE_IFADDR)) {
1152186119Sqingli			LLE_WLOCK(lle);
1153186119Sqingli			lle->la_flags = LLE_DELETED;
1154186119Sqingli			LLE_WUNLOCK(lle);
1155186119Sqingli#ifdef DIAGNOSTICS
1156186119Sqingli			log(LOG_INFO, "ifaddr cache = %p  is deleted\n", lle);
1157186119Sqingli#endif
1158186119Sqingli		}
1159186119Sqingli		lle = (void *)-1;
1160186119Sqingli
1161186119Sqingli	}
1162186544Sbz	if (LLE_IS_VALID(lle)) {
1163186119Sqingli		if (flags & LLE_EXCLUSIVE)
1164186119Sqingli			LLE_WLOCK(lle);
1165186119Sqingli		else
1166186119Sqingli			LLE_RLOCK(lle);
1167186119Sqingli	}
1168186119Sqinglidone:
1169186119Sqingli	return (lle);
1170186119Sqingli}
1171186119Sqingli
1172186119Sqinglistatic int
1173186119Sqingliin_lltable_dump(struct lltable *llt, struct sysctl_req *wr)
1174186119Sqingli{
1175186119Sqingli#define	SIN(lle)	((struct sockaddr_in *) L3_ADDR(lle))
1176186119Sqingli	struct ifnet *ifp = llt->llt_ifp;
1177186119Sqingli	struct llentry *lle;
1178186119Sqingli	/* XXX stack use */
1179186119Sqingli	struct {
1180186119Sqingli		struct rt_msghdr	rtm;
1181186119Sqingli		struct sockaddr_inarp	sin;
1182186119Sqingli		struct sockaddr_dl	sdl;
1183186119Sqingli	} arpc;
1184186119Sqingli	int error, i;
1185186119Sqingli
1186186119Sqingli	/* XXXXX
1187186119Sqingli	 * current IFNET_RLOCK() is mapped to IFNET_WLOCK()
1188186119Sqingli	 * so it is okay to use this ASSERT, change it when
1189186119Sqingli	 * IFNET lock is finalized
1190186119Sqingli	 */
1191186119Sqingli	IFNET_WLOCK_ASSERT();
1192186119Sqingli
1193186119Sqingli	error = 0;
1194186119Sqingli	for (i = 0; i < LLTBL_HASHTBL_SIZE; i++) {
1195186119Sqingli		LIST_FOREACH(lle, &llt->lle_head[i], lle_next) {
1196186119Sqingli			struct sockaddr_dl *sdl;
1197186119Sqingli
1198186119Sqingli			/* skip deleted entries */
1199186119Sqingli			if ((lle->la_flags & (LLE_DELETED|LLE_VALID)) != LLE_VALID)
1200186119Sqingli				continue;
1201186980Sbz			/* Skip if jailed and not a valid IP of the prison. */
1202188144Sjamie			if (prison_if(wr->td->td_ucred, L3_ADDR(lle)) != 0)
1203186980Sbz				continue;
1204186119Sqingli			/*
1205186119Sqingli			 * produce a msg made of:
1206186119Sqingli			 *  struct rt_msghdr;
1207186119Sqingli			 *  struct sockaddr_inarp; (IPv4)
1208186119Sqingli			 *  struct sockaddr_dl;
1209186119Sqingli			 */
1210186119Sqingli			bzero(&arpc, sizeof(arpc));
1211186119Sqingli			arpc.rtm.rtm_msglen = sizeof(arpc);
1212186935Sharti			arpc.rtm.rtm_version = RTM_VERSION;
1213186935Sharti			arpc.rtm.rtm_type = RTM_GET;
1214186935Sharti			arpc.rtm.rtm_flags = RTF_UP;
1215186935Sharti			arpc.rtm.rtm_addrs = RTA_DST | RTA_GATEWAY;
1216186119Sqingli			arpc.sin.sin_family = AF_INET;
1217186119Sqingli			arpc.sin.sin_len = sizeof(arpc.sin);
1218186119Sqingli			arpc.sin.sin_addr.s_addr = SIN(lle)->sin_addr.s_addr;
1219186119Sqingli
1220186119Sqingli			/* publish */
1221186119Sqingli			if (lle->la_flags & LLE_PUB) {
1222186119Sqingli				arpc.rtm.rtm_flags |= RTF_ANNOUNCE;
1223186119Sqingli				/* proxy only */
1224186119Sqingli				if (lle->la_flags & LLE_PROXY)
1225186119Sqingli					arpc.sin.sin_other = SIN_PROXY;
1226186119Sqingli			}
1227186119Sqingli
1228186119Sqingli			sdl = &arpc.sdl;
1229186119Sqingli			sdl->sdl_family = AF_LINK;
1230186119Sqingli			sdl->sdl_len = sizeof(*sdl);
1231186119Sqingli			sdl->sdl_alen = ifp->if_addrlen;
1232186119Sqingli			sdl->sdl_index = ifp->if_index;
1233186119Sqingli			sdl->sdl_type = ifp->if_type;
1234186119Sqingli			bcopy(&lle->ll_addr, LLADDR(sdl), ifp->if_addrlen);
1235186119Sqingli
1236186119Sqingli			arpc.rtm.rtm_rmx.rmx_expire =
1237186119Sqingli			    lle->la_flags & LLE_STATIC ? 0 : lle->la_expire;
1238186500Sqingli			arpc.rtm.rtm_flags |= (RTF_HOST | RTF_LLDATA);
1239186119Sqingli			if (lle->la_flags & LLE_STATIC)
1240186119Sqingli				arpc.rtm.rtm_flags |= RTF_STATIC;
1241186119Sqingli			arpc.rtm.rtm_index = ifp->if_index;
1242186119Sqingli			error = SYSCTL_OUT(wr, &arpc, sizeof(arpc));
1243186119Sqingli			if (error)
1244186119Sqingli				break;
1245186119Sqingli		}
1246186119Sqingli	}
1247186119Sqingli	return error;
1248186119Sqingli#undef SIN
1249186119Sqingli}
1250186119Sqingli
1251186119Sqinglivoid *
1252186119Sqingliin_domifattach(struct ifnet *ifp)
1253186119Sqingli{
1254186119Sqingli	struct lltable *llt = lltable_init(ifp, AF_INET);
1255186119Sqingli
1256186119Sqingli	if (llt != NULL) {
1257186119Sqingli		llt->llt_new = in_lltable_new;
1258186119Sqingli		llt->llt_free = in_lltable_free;
1259186119Sqingli		llt->llt_rtcheck = in_lltable_rtcheck;
1260186119Sqingli		llt->llt_lookup = in_lltable_lookup;
1261186119Sqingli		llt->llt_dump = in_lltable_dump;
1262186119Sqingli	}
1263186119Sqingli	return (llt);
1264186119Sqingli}
1265186119Sqingli
1266186119Sqinglivoid
1267186119Sqingliin_domifdetach(struct ifnet *ifp __unused, void *aux)
1268186119Sqingli{
1269186119Sqingli	struct lltable *llt = (struct lltable *)aux;
1270186119Sqingli
1271186119Sqingli	lltable_free(llt);
1272186119Sqingli}
1273