in.c revision 189592
1139823Simp/*-
21541Srgrimes * Copyright (c) 1982, 1986, 1991, 1993
31541Srgrimes *	The Regents of the University of California.  All rights reserved.
4137668Smlaier * Copyright (C) 2001 WIDE Project.  All rights reserved.
51541Srgrimes *
61541Srgrimes * Redistribution and use in source and binary forms, with or without
71541Srgrimes * modification, are permitted provided that the following conditions
81541Srgrimes * are met:
91541Srgrimes * 1. Redistributions of source code must retain the above copyright
101541Srgrimes *    notice, this list of conditions and the following disclaimer.
111541Srgrimes * 2. Redistributions in binary form must reproduce the above copyright
121541Srgrimes *    notice, this list of conditions and the following disclaimer in the
131541Srgrimes *    documentation and/or other materials provided with the distribution.
141541Srgrimes * 4. Neither the name of the University nor the names of its contributors
151541Srgrimes *    may be used to endorse or promote products derived from this software
161541Srgrimes *    without specific prior written permission.
171541Srgrimes *
181541Srgrimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
191541Srgrimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
201541Srgrimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
211541Srgrimes * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
221541Srgrimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
231541Srgrimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
241541Srgrimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
251541Srgrimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
261541Srgrimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
271541Srgrimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
281541Srgrimes * SUCH DAMAGE.
291541Srgrimes *
3010939Swollman *	@(#)in.c	8.4 (Berkeley) 1/9/95
311541Srgrimes */
321541Srgrimes
33172467Ssilby#include <sys/cdefs.h>
34172467Ssilby__FBSDID("$FreeBSD: head/sys/netinet/in.c 189592 2009-03-09 17:53:05Z bms $");
35172467Ssilby
36143868Sglebius#include "opt_carp.h"
37143868Sglebius
381541Srgrimes#include <sys/param.h>
391549Srgrimes#include <sys/systm.h>
4024204Sbde#include <sys/sockio.h>
411541Srgrimes#include <sys/malloc.h>
42164033Srwatson#include <sys/priv.h>
431541Srgrimes#include <sys/socket.h>
44186948Sbz#include <sys/jail.h>
4512704Sphk#include <sys/kernel.h>
46186948Sbz#include <sys/proc.h>
4712704Sphk#include <sys/sysctl.h>
48181803Sbz#include <sys/vimage.h>
491541Srgrimes
501541Srgrimes#include <net/if.h>
51186119Sqingli#include <net/if_llatbl.h>
5255009Sshin#include <net/if_types.h>
531541Srgrimes#include <net/route.h>
541541Srgrimes
551541Srgrimes#include <netinet/in.h>
561541Srgrimes#include <netinet/in_var.h>
5781127Sume#include <netinet/in_pcb.h>
58170613Sbms#include <netinet/ip_var.h>
59185571Sbz#include <netinet/vinet.h>
60189592Sbms#include <netinet/igmp_var.h>
611541Srgrimes
6292723Salfredstatic int in_mask2len(struct in_addr *);
6392723Salfredstatic void in_len2mask(struct in_addr *, int);
6492723Salfredstatic int in_lifaddr_ioctl(struct socket *, u_long, caddr_t,
6592723Salfred	struct ifnet *, struct thread *);
6655009Sshin
67137628Smlaierstatic int	in_addprefix(struct in_ifaddr *, int);
68137628Smlaierstatic int	in_scrubprefix(struct in_ifaddr *);
6992723Salfredstatic void	in_socktrim(struct sockaddr_in *);
7092723Salfredstatic int	in_ifinit(struct ifnet *,
7192723Salfred	    struct in_ifaddr *, struct sockaddr_in *, int);
72167729Sbmsstatic void	in_purgemaddrs(struct ifnet *);
731541Srgrimes
74185088Szec#ifdef VIMAGE_GLOBALS
75185088Szecstatic int subnetsarelocal;
76185088Szecstatic int sameprefixcarponly;
77185088Szecextern struct inpcbinfo ripcbinfo;
78185088Szec#endif
79185088Szec
80183550SzecSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_ip, OID_AUTO, subnets_are_local,
81183550Szec	CTLFLAG_RW, subnetsarelocal, 0,
82183550Szec	"Treat all subnets as directly connected");
83183550SzecSYSCTL_V_INT(V_NET, vnet_inet, _net_inet_ip, OID_AUTO, same_prefix_carp_only,
84183550Szec	CTLFLAG_RW, sameprefixcarponly, 0,
85149221Sglebius	"Refuse to create same prefixes on different interfaces");
8621666Swollman
871541Srgrimes/*
881541Srgrimes * Return 1 if an internet address is for a ``local'' host
891541Srgrimes * (one to which we have a connection).  If subnetsarelocal
901541Srgrimes * is true, this includes other subnets of the local net.
911541Srgrimes * Otherwise, it includes only the directly-connected (sub)nets.
921541Srgrimes */
931549Srgrimesint
94169454Srwatsonin_localaddr(struct in_addr in)
951541Srgrimes{
96183550Szec	INIT_VNET_INET(curvnet);
971541Srgrimes	register u_long i = ntohl(in.s_addr);
981541Srgrimes	register struct in_ifaddr *ia;
991541Srgrimes
100181803Sbz	if (V_subnetsarelocal) {
101181803Sbz		TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link)
1021541Srgrimes			if ((i & ia->ia_netmask) == ia->ia_net)
1031541Srgrimes				return (1);
1041541Srgrimes	} else {
105181803Sbz		TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link)
1061541Srgrimes			if ((i & ia->ia_subnetmask) == ia->ia_subnet)
1071541Srgrimes				return (1);
1081541Srgrimes	}
1091541Srgrimes	return (0);
1101541Srgrimes}
1111541Srgrimes
1121541Srgrimes/*
113133486Sandre * Return 1 if an internet address is for the local host and configured
114133486Sandre * on one of its interfaces.
115133486Sandre */
116133486Sandreint
117169454Srwatsonin_localip(struct in_addr in)
118133486Sandre{
119183550Szec	INIT_VNET_INET(curvnet);
120133486Sandre	struct in_ifaddr *ia;
121133486Sandre
122133486Sandre	LIST_FOREACH(ia, INADDR_HASH(in.s_addr), ia_hash) {
123133486Sandre		if (IA_SIN(ia)->sin_addr.s_addr == in.s_addr)
124184295Sbz			return (1);
125133486Sandre	}
126184295Sbz	return (0);
127133486Sandre}
128133486Sandre
129133486Sandre/*
1301541Srgrimes * Determine whether an IP address is in a reserved set of addresses
1311541Srgrimes * that may not be forwarded, or whether datagrams to that destination
1321541Srgrimes * may be forwarded.
1331541Srgrimes */
1341549Srgrimesint
135169454Srwatsonin_canforward(struct in_addr in)
1361541Srgrimes{
1371541Srgrimes	register u_long i = ntohl(in.s_addr);
1381541Srgrimes	register u_long net;
1391541Srgrimes
140166450Sbms	if (IN_EXPERIMENTAL(i) || IN_MULTICAST(i) || IN_LINKLOCAL(i))
1411541Srgrimes		return (0);
1421541Srgrimes	if (IN_CLASSA(i)) {
1431541Srgrimes		net = i & IN_CLASSA_NET;
1441541Srgrimes		if (net == 0 || net == (IN_LOOPBACKNET << IN_CLASSA_NSHIFT))
1451541Srgrimes			return (0);
1461541Srgrimes	}
1471541Srgrimes	return (1);
1481541Srgrimes}
1491541Srgrimes
1501541Srgrimes/*
1511541Srgrimes * Trim a mask in a sockaddr
1521541Srgrimes */
15312296Sphkstatic void
154169454Srwatsonin_socktrim(struct sockaddr_in *ap)
1551541Srgrimes{
1561541Srgrimes    register char *cplim = (char *) &ap->sin_addr;
1571541Srgrimes    register char *cp = (char *) (&ap->sin_addr + 1);
1581541Srgrimes
1591541Srgrimes    ap->sin_len = 0;
1604127Swollman    while (--cp >= cplim)
161133874Srwatson	if (*cp) {
1621541Srgrimes	    (ap)->sin_len = cp - (char *) (ap) + 1;
1631541Srgrimes	    break;
1641541Srgrimes	}
1651541Srgrimes}
1661541Srgrimes
/*
 * Convert an IPv4 netmask, stored in memory order, into a prefix length.
 *
 * The result is the number of leading one bits: whole 0xff bytes are counted
 * first, then the leading one bits of the first byte that is not 0xff.
 * Scanning stops at the first zero bit, so for a non-contiguous mask only
 * the leading run is counted.
 *
 * Returns a value in the range 0..32.
 */
static int
in_mask2len(struct in_addr *mask)
{
	const unsigned char *p = (const unsigned char *)mask;
	const int nbytes = (int)sizeof(*mask);
	int x, y;

	/* Count the bytes that are completely set. */
	for (x = 0; x < nbytes; x++) {
		if (p[x] != 0xff)
			break;
	}

	/* Count the leading one bits of the first partial byte, if any. */
	y = 0;
	if (x < nbytes) {
		for (y = 0; y < 8; y++) {
			if ((p[x] & (0x80 >> y)) == 0)
				break;
		}
	}
	return (x * 8 + y);
}
18855009Sshin
/*
 * Build an IPv4 netmask, in memory order, from a prefix length.
 *
 * `len' is clamped to the range 0..32 before use: a larger value would
 * otherwise store past the end of *mask, and a negative one would produce a
 * negative shift count.  After clamping, the first len bits of *mask are set
 * and the remainder are clear.
 */
static void
in_len2mask(struct in_addr *mask, int len)
{
	const int maxlen = (int)sizeof(*mask) * 8;
	unsigned char *p = (unsigned char *)mask;
	int i;

	bzero(mask, sizeof(*mask));

	if (len <= 0)
		return;
	if (len > maxlen)
		len = maxlen;

	/* Whole bytes first ... */
	for (i = 0; i < len / 8; i++)
		p[i] = 0xff;
	/* ... then the high-order bits of the following byte. */
	if (len % 8)
		p[i] = (0xff00 >> (len % 8)) & 0xff;
}
20255009Sshin
2031541Srgrimes/*
2041541Srgrimes * Generic internet control operations (ioctl's).
2051541Srgrimes * Ifp is 0 if not an interface-specific ioctl.
2061541Srgrimes */
2071541Srgrimes/* ARGSUSED */
2081549Srgrimesint
209169454Srwatsonin_control(struct socket *so, u_long cmd, caddr_t data, struct ifnet *ifp,
210169454Srwatson    struct thread *td)
2111541Srgrimes{
212183550Szec	INIT_VNET_INET(curvnet); /* both so and ifp can be NULL here! */
2131541Srgrimes	register struct ifreq *ifr = (struct ifreq *)data;
214184295Sbz	register struct in_ifaddr *ia, *iap;
2151541Srgrimes	register struct ifaddr *ifa;
216168032Sbms	struct in_addr allhosts_addr;
21784102Sjlemon	struct in_addr dst;
2181541Srgrimes	struct in_ifaddr *oia;
219189592Sbms	struct in_ifinfo *ii;
2201541Srgrimes	struct in_aliasreq *ifra = (struct in_aliasreq *)data;
2211541Srgrimes	struct sockaddr_in oldaddr;
22287124Sbrian	int error, hostIsNew, iaIsNew, maskIsNew, s;
223168032Sbms	int iaIsFirst;
2241541Srgrimes
225184295Sbz	ia = NULL;
226189592Sbms	ii = ((struct in_ifinfo *)ifp->if_afdata[AF_INET]);
227168032Sbms	iaIsFirst = 0;
22887124Sbrian	iaIsNew = 0;
229168032Sbms	allhosts_addr.s_addr = htonl(INADDR_ALLHOSTS_GROUP);
23087124Sbrian
23155009Sshin	switch (cmd) {
23255009Sshin	case SIOCALIFADDR:
233164033Srwatson		if (td != NULL) {
234164033Srwatson			error = priv_check(td, PRIV_NET_ADDIFADDR);
235164033Srwatson			if (error)
236164033Srwatson				return (error);
237164033Srwatson		}
238184295Sbz		if (ifp == NULL)
239184295Sbz			return (EINVAL);
240164033Srwatson		return in_lifaddr_ioctl(so, cmd, data, ifp, td);
241164033Srwatson
24255009Sshin	case SIOCDLIFADDR:
243164033Srwatson		if (td != NULL) {
244164033Srwatson			error = priv_check(td, PRIV_NET_DELIFADDR);
245164033Srwatson			if (error)
246164033Srwatson				return (error);
247164033Srwatson		}
248184295Sbz		if (ifp == NULL)
249184295Sbz			return (EINVAL);
250164033Srwatson		return in_lifaddr_ioctl(so, cmd, data, ifp, td);
251164033Srwatson
25255009Sshin	case SIOCGLIFADDR:
253184295Sbz		if (ifp == NULL)
254184295Sbz			return (EINVAL);
25583366Sjulian		return in_lifaddr_ioctl(so, cmd, data, ifp, td);
25655009Sshin	}
25755009Sshin
2581541Srgrimes	/*
2591541Srgrimes	 * Find address for this interface, if it exists.
26014632Sfenner	 *
26114632Sfenner	 * If an alias address was specified, find that one instead of
26284102Sjlemon	 * the first one on the interface, if possible.
2631541Srgrimes	 */
264184295Sbz	if (ifp != NULL) {
26584102Sjlemon		dst = ((struct sockaddr_in *)&ifr->ifr_addr)->sin_addr;
26684102Sjlemon		LIST_FOREACH(iap, INADDR_HASH(dst.s_addr), ia_hash)
26784102Sjlemon			if (iap->ia_ifp == ifp &&
26884102Sjlemon			    iap->ia_addr.sin_addr.s_addr == dst.s_addr) {
269186948Sbz				if (td == NULL || prison_check_ip4(
270188144Sjamie				    td->td_ucred, &dst) == 0)
271186948Sbz					ia = iap;
27284102Sjlemon				break;
27384102Sjlemon			}
27484102Sjlemon		if (ia == NULL)
27584102Sjlemon			TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link) {
27684102Sjlemon				iap = ifatoia(ifa);
27784102Sjlemon				if (iap->ia_addr.sin_family == AF_INET) {
278186948Sbz					if (td != NULL &&
279188144Sjamie					    prison_check_ip4(td->td_ucred,
280188144Sjamie					    &iap->ia_addr.sin_addr) != 0)
281186948Sbz						continue;
28214632Sfenner					ia = iap;
28314632Sfenner					break;
28414632Sfenner				}
28514632Sfenner			}
286168032Sbms		if (ia == NULL)
287168032Sbms			iaIsFirst = 1;
28884102Sjlemon	}
2891541Srgrimes
2901541Srgrimes	switch (cmd) {
2911541Srgrimes
2921541Srgrimes	case SIOCAIFADDR:
2931541Srgrimes	case SIOCDIFADDR:
294184295Sbz		if (ifp == NULL)
29541575Seivind			return (EADDRNOTAVAIL);
2968071Swollman		if (ifra->ifra_addr.sin_family == AF_INET) {
29771999Sphk			for (oia = ia; ia; ia = TAILQ_NEXT(ia, ia_link)) {
2988071Swollman				if (ia->ia_ifp == ifp  &&
2998071Swollman				    ia->ia_addr.sin_addr.s_addr ==
3008071Swollman				    ifra->ifra_addr.sin_addr.s_addr)
3018071Swollman					break;
3028071Swollman			}
3038876Srgrimes			if ((ifp->if_flags & IFF_POINTOPOINT)
3048071Swollman			    && (cmd == SIOCAIFADDR)
3058071Swollman			    && (ifra->ifra_dstaddr.sin_addr.s_addr
3068071Swollman				== INADDR_ANY)) {
307184295Sbz				return (EDESTADDRREQ);
3088071Swollman			}
3091541Srgrimes		}
310184295Sbz		if (cmd == SIOCDIFADDR && ia == NULL)
3111541Srgrimes			return (EADDRNOTAVAIL);
3121541Srgrimes		/* FALLTHROUGH */
3131541Srgrimes	case SIOCSIFADDR:
3141541Srgrimes	case SIOCSIFNETMASK:
3151541Srgrimes	case SIOCSIFDSTADDR:
316164033Srwatson		if (td != NULL) {
317175626Sbz			error = priv_check(td, (cmd == SIOCDIFADDR) ?
318175626Sbz			    PRIV_NET_DELIFADDR : PRIV_NET_ADDIFADDR);
319164033Srwatson			if (error)
320164033Srwatson				return (error);
321164033Srwatson		}
3221541Srgrimes
323184295Sbz		if (ifp == NULL)
32441575Seivind			return (EADDRNOTAVAIL);
325184295Sbz		if (ia == NULL) {
32620407Swollman			ia = (struct in_ifaddr *)
327111119Simp				malloc(sizeof *ia, M_IFADDR, M_WAITOK | M_ZERO);
328184295Sbz			if (ia == NULL)
3291541Srgrimes				return (ENOBUFS);
33015092Sdg			/*
33115092Sdg			 * Protect from ipintr() traversing address list
33215092Sdg			 * while we're modifying it.
33315092Sdg			 */
33415092Sdg			s = splnet();
33520407Swollman			ifa = &ia->ia_ifa;
336108033Shsu			IFA_LOCK_INIT(ifa);
33720407Swollman			ifa->ifa_addr = (struct sockaddr *)&ia->ia_addr;
33820407Swollman			ifa->ifa_dstaddr = (struct sockaddr *)&ia->ia_dstaddr;
33920407Swollman			ifa->ifa_netmask = (struct sockaddr *)&ia->ia_sockmask;
340108033Shsu			ifa->ifa_refcnt = 1;
341108033Shsu			TAILQ_INSERT_TAIL(&ifp->if_addrhead, ifa, ifa_link);
342108033Shsu
3431541Srgrimes			ia->ia_sockmask.sin_len = 8;
34485740Sdes			ia->ia_sockmask.sin_family = AF_INET;
3451541Srgrimes			if (ifp->if_flags & IFF_BROADCAST) {
3461541Srgrimes				ia->ia_broadaddr.sin_len = sizeof(ia->ia_addr);
3471541Srgrimes				ia->ia_broadaddr.sin_family = AF_INET;
3481541Srgrimes			}
3491541Srgrimes			ia->ia_ifp = ifp;
350151824Sglebius
351181803Sbz			TAILQ_INSERT_TAIL(&V_in_ifaddrhead, ia, ia_link);
35215092Sdg			splx(s);
35387124Sbrian			iaIsNew = 1;
3541541Srgrimes		}
3551541Srgrimes		break;
3561541Srgrimes
3571541Srgrimes	case SIOCSIFBRDADDR:
358164033Srwatson		if (td != NULL) {
359164033Srwatson			error = priv_check(td, PRIV_NET_ADDIFADDR);
360164033Srwatson			if (error)
361164033Srwatson				return (error);
362164033Srwatson		}
3631541Srgrimes		/* FALLTHROUGH */
3641541Srgrimes
3651541Srgrimes	case SIOCGIFADDR:
3661541Srgrimes	case SIOCGIFNETMASK:
3671541Srgrimes	case SIOCGIFDSTADDR:
3681541Srgrimes	case SIOCGIFBRDADDR:
369184295Sbz		if (ia == NULL)
3701541Srgrimes			return (EADDRNOTAVAIL);
3711541Srgrimes		break;
3721541Srgrimes	}
3731541Srgrimes	switch (cmd) {
3741541Srgrimes
3751541Srgrimes	case SIOCGIFADDR:
3761541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_addr) = ia->ia_addr;
37787124Sbrian		return (0);
3781541Srgrimes
3791541Srgrimes	case SIOCGIFBRDADDR:
3801541Srgrimes		if ((ifp->if_flags & IFF_BROADCAST) == 0)
3811541Srgrimes			return (EINVAL);
3821541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_dstaddr) = ia->ia_broadaddr;
38387124Sbrian		return (0);
3841541Srgrimes
3851541Srgrimes	case SIOCGIFDSTADDR:
3861541Srgrimes		if ((ifp->if_flags & IFF_POINTOPOINT) == 0)
3871541Srgrimes			return (EINVAL);
3881541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_dstaddr) = ia->ia_dstaddr;
38987124Sbrian		return (0);
3901541Srgrimes
3911541Srgrimes	case SIOCGIFNETMASK:
3921541Srgrimes		*((struct sockaddr_in *)&ifr->ifr_addr) = ia->ia_sockmask;
39387124Sbrian		return (0);
3941541Srgrimes
3951541Srgrimes	case SIOCSIFDSTADDR:
3961541Srgrimes		if ((ifp->if_flags & IFF_POINTOPOINT) == 0)
3971541Srgrimes			return (EINVAL);
3981541Srgrimes		oldaddr = ia->ia_dstaddr;
3991541Srgrimes		ia->ia_dstaddr = *(struct sockaddr_in *)&ifr->ifr_dstaddr;
400184295Sbz		if (ifp->if_ioctl != NULL) {
401146883Siedowse			IFF_LOCKGIANT(ifp);
402146883Siedowse			error = (*ifp->if_ioctl)(ifp, SIOCSIFDSTADDR,
403146883Siedowse			    (caddr_t)ia);
404146883Siedowse			IFF_UNLOCKGIANT(ifp);
405146883Siedowse			if (error) {
406146883Siedowse				ia->ia_dstaddr = oldaddr;
407146883Siedowse				return (error);
408146883Siedowse			}
4091541Srgrimes		}
4101541Srgrimes		if (ia->ia_flags & IFA_ROUTE) {
4111541Srgrimes			ia->ia_ifa.ifa_dstaddr = (struct sockaddr *)&oldaddr;
4121541Srgrimes			rtinit(&(ia->ia_ifa), (int)RTM_DELETE, RTF_HOST);
4131541Srgrimes			ia->ia_ifa.ifa_dstaddr =
4141541Srgrimes					(struct sockaddr *)&ia->ia_dstaddr;
4151541Srgrimes			rtinit(&(ia->ia_ifa), (int)RTM_ADD, RTF_HOST|RTF_UP);
4161541Srgrimes		}
41787124Sbrian		return (0);
4181541Srgrimes
4191541Srgrimes	case SIOCSIFBRDADDR:
4201541Srgrimes		if ((ifp->if_flags & IFF_BROADCAST) == 0)
4211541Srgrimes			return (EINVAL);
4221541Srgrimes		ia->ia_broadaddr = *(struct sockaddr_in *)&ifr->ifr_broadaddr;
42387124Sbrian		return (0);
4241541Srgrimes
4251541Srgrimes	case SIOCSIFADDR:
42687124Sbrian		error = in_ifinit(ifp, ia,
42787124Sbrian		    (struct sockaddr_in *) &ifr->ifr_addr, 1);
42887124Sbrian		if (error != 0 && iaIsNew)
42987124Sbrian			break;
430168032Sbms		if (error == 0) {
431189592Sbms			if (iaIsFirst &&
432189592Sbms			    (ifp->if_flags & IFF_MULTICAST) != 0) {
433189592Sbms				error = in_joingroup(ifp, &allhosts_addr,
434189592Sbms				    NULL, &ii->ii_allhosts);
435189592Sbms			}
436126264Smlaier			EVENTHANDLER_INVOKE(ifaddr_event, ifp);
437168032Sbms		}
43887124Sbrian		return (0);
4391541Srgrimes
4401541Srgrimes	case SIOCSIFNETMASK:
44185740Sdes		ia->ia_sockmask.sin_addr = ifra->ifra_addr.sin_addr;
44285740Sdes		ia->ia_subnetmask = ntohl(ia->ia_sockmask.sin_addr.s_addr);
44387124Sbrian		return (0);
4441541Srgrimes
4451541Srgrimes	case SIOCAIFADDR:
4461541Srgrimes		maskIsNew = 0;
4471541Srgrimes		hostIsNew = 1;
4481541Srgrimes		error = 0;
4491541Srgrimes		if (ia->ia_addr.sin_family == AF_INET) {
4501541Srgrimes			if (ifra->ifra_addr.sin_len == 0) {
4511541Srgrimes				ifra->ifra_addr = ia->ia_addr;
4521541Srgrimes				hostIsNew = 0;
4531541Srgrimes			} else if (ifra->ifra_addr.sin_addr.s_addr ==
4541541Srgrimes					       ia->ia_addr.sin_addr.s_addr)
4551541Srgrimes				hostIsNew = 0;
4561541Srgrimes		}
4571541Srgrimes		if (ifra->ifra_mask.sin_len) {
4581541Srgrimes			in_ifscrub(ifp, ia);
4591541Srgrimes			ia->ia_sockmask = ifra->ifra_mask;
46085740Sdes			ia->ia_sockmask.sin_family = AF_INET;
4611541Srgrimes			ia->ia_subnetmask =
4621541Srgrimes			     ntohl(ia->ia_sockmask.sin_addr.s_addr);
4631541Srgrimes			maskIsNew = 1;
4641541Srgrimes		}
4651541Srgrimes		if ((ifp->if_flags & IFF_POINTOPOINT) &&
4661541Srgrimes		    (ifra->ifra_dstaddr.sin_family == AF_INET)) {
4671541Srgrimes			in_ifscrub(ifp, ia);
4681541Srgrimes			ia->ia_dstaddr = ifra->ifra_dstaddr;
4691541Srgrimes			maskIsNew  = 1; /* We lie; but the effect's the same */
4701541Srgrimes		}
4711541Srgrimes		if (ifra->ifra_addr.sin_family == AF_INET &&
4721541Srgrimes		    (hostIsNew || maskIsNew))
4731541Srgrimes			error = in_ifinit(ifp, ia, &ifra->ifra_addr, 0);
47487124Sbrian		if (error != 0 && iaIsNew)
47587124Sbrian			break;
47687124Sbrian
4771541Srgrimes		if ((ifp->if_flags & IFF_BROADCAST) &&
4781541Srgrimes		    (ifra->ifra_broadaddr.sin_family == AF_INET))
4791541Srgrimes			ia->ia_broadaddr = ifra->ifra_broadaddr;
480168032Sbms		if (error == 0) {
481189592Sbms			if (iaIsFirst &&
482189592Sbms			    (ifp->if_flags & IFF_MULTICAST) != 0) {
483189592Sbms				error = in_joingroup(ifp, &allhosts_addr,
484189592Sbms				    NULL, &ii->ii_allhosts);
485189592Sbms			}
486126264Smlaier			EVENTHANDLER_INVOKE(ifaddr_event, ifp);
487168032Sbms		}
4881541Srgrimes		return (error);
4891541Srgrimes
4901541Srgrimes	case SIOCDIFADDR:
49174299Sru		/*
49274299Sru		 * in_ifscrub kills the interface route.
49374299Sru		 */
4941541Srgrimes		in_ifscrub(ifp, ia);
49515092Sdg		/*
49674299Sru		 * in_ifadown gets rid of all the rest of
49774299Sru		 * the routes.  This is not quite the right
49874299Sru		 * thing to do, but at least if we are running
49974299Sru		 * a routing process they will come back.
50074299Sru		 */
50176469Sru		in_ifadown(&ia->ia_ifa, 1);
502126264Smlaier		EVENTHANDLER_INVOKE(ifaddr_event, ifp);
50387124Sbrian		error = 0;
5041541Srgrimes		break;
5051541Srgrimes
5061541Srgrimes	default:
507184295Sbz		if (ifp == NULL || ifp->if_ioctl == NULL)
5081541Srgrimes			return (EOPNOTSUPP);
509146883Siedowse		IFF_LOCKGIANT(ifp);
510146883Siedowse		error = (*ifp->if_ioctl)(ifp, cmd, data);
511146883Siedowse		IFF_UNLOCKGIANT(ifp);
512146883Siedowse		return (error);
5131541Srgrimes	}
51487124Sbrian
51587124Sbrian	/*
51687124Sbrian	 * Protect from ipintr() traversing address list while we're modifying
51787124Sbrian	 * it.
51887124Sbrian	 */
51987124Sbrian	s = splnet();
52087124Sbrian	TAILQ_REMOVE(&ifp->if_addrhead, &ia->ia_ifa, ifa_link);
521181803Sbz	TAILQ_REMOVE(&V_in_ifaddrhead, ia, ia_link);
522168032Sbms	if (ia->ia_addr.sin_family == AF_INET) {
523154777Sandre		LIST_REMOVE(ia, ia_hash);
524168032Sbms		/*
525168032Sbms		 * If this is the last IPv4 address configured on this
526168032Sbms		 * interface, leave the all-hosts group.
527189592Sbms		 * No state-change report need be transmitted.
528168032Sbms		 */
529168032Sbms		oia = NULL;
530168032Sbms		IFP_TO_IA(ifp, oia);
531168032Sbms		if (oia == NULL) {
532168032Sbms			IFF_LOCKGIANT(ifp);
533168032Sbms			IN_MULTI_LOCK();
534189592Sbms			if (ii->ii_allhosts) {
535189592Sbms				(void)in_leavegroup_locked(ii->ii_allhosts,
536189592Sbms				    NULL);
537189592Sbms				ii->ii_allhosts = NULL;
538189592Sbms			}
539168032Sbms			IN_MULTI_UNLOCK();
540168032Sbms			IFF_UNLOCKGIANT(ifp);
541168032Sbms		}
542168032Sbms	}
54387124Sbrian	IFAFREE(&ia->ia_ifa);
54487124Sbrian	splx(s);
54587124Sbrian
54687124Sbrian	return (error);
5471541Srgrimes}
5481541Srgrimes
5491541Srgrimes/*
55055009Sshin * SIOC[GAD]LIFADDR.
55155009Sshin *	SIOCGLIFADDR: get first address. (?!?)
55255009Sshin *	SIOCGLIFADDR with IFLR_PREFIX:
55355009Sshin *		get first address that matches the specified prefix.
55455009Sshin *	SIOCALIFADDR: add the specified address.
55555009Sshin *	SIOCALIFADDR with IFLR_PREFIX:
55655009Sshin *		EINVAL since we can't deduce hostid part of the address.
55755009Sshin *	SIOCDLIFADDR: delete the specified address.
55855009Sshin *	SIOCDLIFADDR with IFLR_PREFIX:
55955009Sshin *		delete the first address that matches the specified prefix.
56055009Sshin * return values:
56155009Sshin *	EINVAL on invalid parameters
56255009Sshin *	EADDRNOTAVAIL on prefix match failed/specified address not found
56355009Sshin *	other values may be returned from in_ioctl()
56455009Sshin */
56555009Sshinstatic int
566169454Srwatsonin_lifaddr_ioctl(struct socket *so, u_long cmd, caddr_t data,
567169454Srwatson    struct ifnet *ifp, struct thread *td)
56855009Sshin{
56955009Sshin	struct if_laddrreq *iflr = (struct if_laddrreq *)data;
57055009Sshin	struct ifaddr *ifa;
57155009Sshin
57255009Sshin	/* sanity checks */
573184295Sbz	if (data == NULL || ifp == NULL) {
57455009Sshin		panic("invalid argument to in_lifaddr_ioctl");
57555009Sshin		/*NOTRECHED*/
57655009Sshin	}
57755009Sshin
57855009Sshin	switch (cmd) {
57955009Sshin	case SIOCGLIFADDR:
58055009Sshin		/* address must be specified on GET with IFLR_PREFIX */
58155009Sshin		if ((iflr->flags & IFLR_PREFIX) == 0)
58255009Sshin			break;
58355009Sshin		/*FALLTHROUGH*/
58455009Sshin	case SIOCALIFADDR:
58555009Sshin	case SIOCDLIFADDR:
58655009Sshin		/* address must be specified on ADD and DELETE */
58755917Sshin		if (iflr->addr.ss_family != AF_INET)
588184295Sbz			return (EINVAL);
58955917Sshin		if (iflr->addr.ss_len != sizeof(struct sockaddr_in))
590184295Sbz			return (EINVAL);
59155009Sshin		/* XXX need improvement */
59255917Sshin		if (iflr->dstaddr.ss_family
59355917Sshin		 && iflr->dstaddr.ss_family != AF_INET)
594184295Sbz			return (EINVAL);
59555917Sshin		if (iflr->dstaddr.ss_family
59655917Sshin		 && iflr->dstaddr.ss_len != sizeof(struct sockaddr_in))
597184295Sbz			return (EINVAL);
59855009Sshin		break;
59955009Sshin	default: /*shouldn't happen*/
600184295Sbz		return (EOPNOTSUPP);
60155009Sshin	}
60255009Sshin	if (sizeof(struct in_addr) * 8 < iflr->prefixlen)
603184295Sbz		return (EINVAL);
60455009Sshin
60555009Sshin	switch (cmd) {
60655009Sshin	case SIOCALIFADDR:
60755009Sshin	    {
60855009Sshin		struct in_aliasreq ifra;
60955009Sshin
61055009Sshin		if (iflr->flags & IFLR_PREFIX)
611184295Sbz			return (EINVAL);
61255009Sshin
61355009Sshin		/* copy args to in_aliasreq, perform ioctl(SIOCAIFADDR_IN6). */
61455009Sshin		bzero(&ifra, sizeof(ifra));
61555009Sshin		bcopy(iflr->iflr_name, ifra.ifra_name,
61655009Sshin			sizeof(ifra.ifra_name));
61755009Sshin
61855917Sshin		bcopy(&iflr->addr, &ifra.ifra_addr, iflr->addr.ss_len);
61955009Sshin
62055917Sshin		if (iflr->dstaddr.ss_family) {	/*XXX*/
62155009Sshin			bcopy(&iflr->dstaddr, &ifra.ifra_dstaddr,
62255917Sshin				iflr->dstaddr.ss_len);
62355009Sshin		}
62455009Sshin
62555009Sshin		ifra.ifra_mask.sin_family = AF_INET;
62655009Sshin		ifra.ifra_mask.sin_len = sizeof(struct sockaddr_in);
62755009Sshin		in_len2mask(&ifra.ifra_mask.sin_addr, iflr->prefixlen);
62855009Sshin
629184295Sbz		return (in_control(so, SIOCAIFADDR, (caddr_t)&ifra, ifp, td));
63055009Sshin	    }
63155009Sshin	case SIOCGLIFADDR:
63255009Sshin	case SIOCDLIFADDR:
63355009Sshin	    {
63455009Sshin		struct in_ifaddr *ia;
63555009Sshin		struct in_addr mask, candidate, match;
63655009Sshin		struct sockaddr_in *sin;
63755009Sshin
63855009Sshin		bzero(&mask, sizeof(mask));
639170855Smjacob		bzero(&match, sizeof(match));
64055009Sshin		if (iflr->flags & IFLR_PREFIX) {
64155009Sshin			/* lookup a prefix rather than address. */
64255009Sshin			in_len2mask(&mask, iflr->prefixlen);
64355009Sshin
64455009Sshin			sin = (struct sockaddr_in *)&iflr->addr;
64555009Sshin			match.s_addr = sin->sin_addr.s_addr;
64655009Sshin			match.s_addr &= mask.s_addr;
64755009Sshin
64855009Sshin			/* if you set extra bits, that's wrong */
64955009Sshin			if (match.s_addr != sin->sin_addr.s_addr)
650184295Sbz				return (EINVAL);
65155009Sshin
65255009Sshin		} else {
653170855Smjacob			/* on getting an address, take the 1st match */
654170855Smjacob			/* on deleting an address, do exact match */
655170855Smjacob			if (cmd != SIOCGLIFADDR) {
65655009Sshin				in_len2mask(&mask, 32);
65755009Sshin				sin = (struct sockaddr_in *)&iflr->addr;
65855009Sshin				match.s_addr = sin->sin_addr.s_addr;
65955009Sshin			}
66055009Sshin		}
66155009Sshin
66255009Sshin		TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link)	{
66355009Sshin			if (ifa->ifa_addr->sa_family != AF_INET6)
66455009Sshin				continue;
665170855Smjacob			if (match.s_addr == 0)
66655009Sshin				break;
66755009Sshin			candidate.s_addr = ((struct sockaddr_in *)&ifa->ifa_addr)->sin_addr.s_addr;
66855009Sshin			candidate.s_addr &= mask.s_addr;
66955009Sshin			if (candidate.s_addr == match.s_addr)
67055009Sshin				break;
67155009Sshin		}
672184295Sbz		if (ifa == NULL)
673184295Sbz			return (EADDRNOTAVAIL);
67455009Sshin		ia = (struct in_ifaddr *)ifa;
67555009Sshin
67655009Sshin		if (cmd == SIOCGLIFADDR) {
67755009Sshin			/* fill in the if_laddrreq structure */
67855009Sshin			bcopy(&ia->ia_addr, &iflr->addr, ia->ia_addr.sin_len);
67955009Sshin
68055009Sshin			if ((ifp->if_flags & IFF_POINTOPOINT) != 0) {
68155009Sshin				bcopy(&ia->ia_dstaddr, &iflr->dstaddr,
68255009Sshin					ia->ia_dstaddr.sin_len);
68355009Sshin			} else
68455009Sshin				bzero(&iflr->dstaddr, sizeof(iflr->dstaddr));
68555009Sshin
68655009Sshin			iflr->prefixlen =
68755009Sshin				in_mask2len(&ia->ia_sockmask.sin_addr);
68855009Sshin
68955009Sshin			iflr->flags = 0;	/*XXX*/
69055009Sshin
691184295Sbz			return (0);
69255009Sshin		} else {
69355009Sshin			struct in_aliasreq ifra;
69455009Sshin
69555009Sshin			/* fill in_aliasreq and do ioctl(SIOCDIFADDR_IN6) */
69655009Sshin			bzero(&ifra, sizeof(ifra));
69755009Sshin			bcopy(iflr->iflr_name, ifra.ifra_name,
69855009Sshin				sizeof(ifra.ifra_name));
69955009Sshin
70055009Sshin			bcopy(&ia->ia_addr, &ifra.ifra_addr,
70155009Sshin				ia->ia_addr.sin_len);
70255009Sshin			if ((ifp->if_flags & IFF_POINTOPOINT) != 0) {
70355009Sshin				bcopy(&ia->ia_dstaddr, &ifra.ifra_dstaddr,
70455009Sshin					ia->ia_dstaddr.sin_len);
70555009Sshin			}
70655009Sshin			bcopy(&ia->ia_sockmask, &ifra.ifra_dstaddr,
70755009Sshin				ia->ia_sockmask.sin_len);
70855009Sshin
709184295Sbz			return (in_control(so, SIOCDIFADDR, (caddr_t)&ifra,
710184295Sbz			    ifp, td));
71155009Sshin		}
71255009Sshin	    }
71355009Sshin	}
71455009Sshin
715184295Sbz	return (EOPNOTSUPP);	/*just for safety*/
71655009Sshin}
71755009Sshin
/*
 * Delete any existing route for an interface address.
 *
 * This is a thin wrapper that hands `ia' to in_scrubprefix() and discards
 * its result; `ifp' is not used.
 */
void
in_ifscrub(struct ifnet *ifp, struct in_ifaddr *ia)
{

	(void)in_scrubprefix(ia);
}
7271541Srgrimes
7281541Srgrimes/*
7291541Srgrimes * Initialize an interface's internet address
7301541Srgrimes * and routing table entry.
7311541Srgrimes */
73212296Sphkstatic int
733169454Srwatsonin_ifinit(struct ifnet *ifp, struct in_ifaddr *ia, struct sockaddr_in *sin,
734169454Srwatson    int scrub)
7351541Srgrimes{
736183550Szec	INIT_VNET_INET(ifp->if_vnet);
7371541Srgrimes	register u_long i = ntohl(sin->sin_addr.s_addr);
7381541Srgrimes	struct sockaddr_in oldaddr;
73994326Sbrian	int s = splimp(), flags = RTF_UP, error = 0;
7401541Srgrimes
7411541Srgrimes	oldaddr = ia->ia_addr;
742105748Ssuz	if (oldaddr.sin_family == AF_INET)
743105748Ssuz		LIST_REMOVE(ia, ia_hash);
7441541Srgrimes	ia->ia_addr = *sin;
745105748Ssuz	if (ia->ia_addr.sin_family == AF_INET)
746105748Ssuz		LIST_INSERT_HEAD(INADDR_HASH(ia->ia_addr.sin_addr.s_addr),
747105748Ssuz		    ia, ia_hash);
7481541Srgrimes	/*
7491541Srgrimes	 * Give the interface a chance to initialize
7501541Srgrimes	 * if this is its first address,
7511541Srgrimes	 * and to validate the address if necessary.
7521541Srgrimes	 */
753184295Sbz	if (ifp->if_ioctl != NULL) {
754146883Siedowse		IFF_LOCKGIANT(ifp);
755146883Siedowse		error = (*ifp->if_ioctl)(ifp, SIOCSIFADDR, (caddr_t)ia);
756146883Siedowse		IFF_UNLOCKGIANT(ifp);
757146883Siedowse		if (error) {
758146883Siedowse			splx(s);
759146883Siedowse			/* LIST_REMOVE(ia, ia_hash) is done in in_control */
760146883Siedowse			ia->ia_addr = oldaddr;
761146883Siedowse			if (ia->ia_addr.sin_family == AF_INET)
762146883Siedowse				LIST_INSERT_HEAD(INADDR_HASH(
763146883Siedowse				    ia->ia_addr.sin_addr.s_addr), ia, ia_hash);
764179971Sgonzo			else
765179971Sgonzo				/*
766179971Sgonzo				 * If oldaddr family is not AF_INET (e.g.
767179971Sgonzo				 * interface has been just created) in_control
768179971Sgonzo				 * does not call LIST_REMOVE, and we end up
769179971Sgonzo				 * with bogus ia entries in hash
770179971Sgonzo				 */
771179971Sgonzo				LIST_REMOVE(ia, ia_hash);
772146883Siedowse			return (error);
773146883Siedowse		}
7741541Srgrimes	}
7751541Srgrimes	splx(s);
7761541Srgrimes	if (scrub) {
7771541Srgrimes		ia->ia_ifa.ifa_addr = (struct sockaddr *)&oldaddr;
7781541Srgrimes		in_ifscrub(ifp, ia);
7791541Srgrimes		ia->ia_ifa.ifa_addr = (struct sockaddr *)&ia->ia_addr;
7801541Srgrimes	}
7811541Srgrimes	if (IN_CLASSA(i))
7821541Srgrimes		ia->ia_netmask = IN_CLASSA_NET;
7831541Srgrimes	else if (IN_CLASSB(i))
7841541Srgrimes		ia->ia_netmask = IN_CLASSB_NET;
7851541Srgrimes	else
7861541Srgrimes		ia->ia_netmask = IN_CLASSC_NET;
7871541Srgrimes	/*
7881541Srgrimes	 * The subnet mask usually includes at least the standard network part,
7891541Srgrimes	 * but may may be smaller in the case of supernetting.
7901541Srgrimes	 * If it is set, we believe it.
7911541Srgrimes	 */
7921541Srgrimes	if (ia->ia_subnetmask == 0) {
7931541Srgrimes		ia->ia_subnetmask = ia->ia_netmask;
7941541Srgrimes		ia->ia_sockmask.sin_addr.s_addr = htonl(ia->ia_subnetmask);
7951541Srgrimes	} else
7961541Srgrimes		ia->ia_netmask &= ia->ia_subnetmask;
7971541Srgrimes	ia->ia_net = i & ia->ia_netmask;
7981541Srgrimes	ia->ia_subnet = i & ia->ia_subnetmask;
7991541Srgrimes	in_socktrim(&ia->ia_sockmask);
800143868Sglebius#ifdef DEV_CARP
8011541Srgrimes	/*
802143868Sglebius	 * XXX: carp(4) does not have interface route
803143868Sglebius	 */
804143868Sglebius	if (ifp->if_type == IFT_CARP)
805143868Sglebius		return (0);
806143868Sglebius#endif
807143868Sglebius	/*
8081541Srgrimes	 * Add route for the network.
8091541Srgrimes	 */
8101541Srgrimes	ia->ia_ifa.ifa_metric = ifp->if_metric;
8111541Srgrimes	if (ifp->if_flags & IFF_BROADCAST) {
8121541Srgrimes		ia->ia_broadaddr.sin_addr.s_addr =
8131541Srgrimes			htonl(ia->ia_subnet | ~ia->ia_subnetmask);
8141541Srgrimes		ia->ia_netbroadcast.s_addr =
8151541Srgrimes			htonl(ia->ia_net | ~ ia->ia_netmask);
8161541Srgrimes	} else if (ifp->if_flags & IFF_LOOPBACK) {
817137833Smlaier		ia->ia_dstaddr = ia->ia_addr;
8181541Srgrimes		flags |= RTF_HOST;
8191541Srgrimes	} else if (ifp->if_flags & IFF_POINTOPOINT) {
8201541Srgrimes		if (ia->ia_dstaddr.sin_family != AF_INET)
8211541Srgrimes			return (0);
8221541Srgrimes		flags |= RTF_HOST;
8231541Srgrimes	}
824137628Smlaier	if ((error = in_addprefix(ia, flags)) != 0)
825137628Smlaier		return (error);
82694326Sbrian
8271541Srgrimes	return (error);
8281541Srgrimes}
8291541Srgrimes
/*
 * Extra route flags for the interface route of address (x): RTF_HOST when
 * its interface has IFF_LOOPBACK or IFF_POINTOPOINT set, otherwise none.
 */
#define	rtinitflags(x)							\
	(((x)->ia_ifp->if_flags & (IFF_LOOPBACK | IFF_POINTOPOINT)) ?	\
	    RTF_HOST : 0)
833137628Smlaier/*
834170855Smjacob * Check if we have a route for the given prefix already or add one accordingly.
835137628Smlaier */
836137628Smlaierstatic int
837169454Srwatsonin_addprefix(struct in_ifaddr *target, int flags)
838137628Smlaier{
839183550Szec	INIT_VNET_INET(curvnet);
840137628Smlaier	struct in_ifaddr *ia;
841151555Sglebius	struct in_addr prefix, mask, p, m;
842137628Smlaier	int error;
8431541Srgrimes
844170855Smjacob	if ((flags & RTF_HOST) != 0) {
845137628Smlaier		prefix = target->ia_dstaddr.sin_addr;
846170855Smjacob		mask.s_addr = 0;
847170855Smjacob	} else {
848137628Smlaier		prefix = target->ia_addr.sin_addr;
849137628Smlaier		mask = target->ia_sockmask.sin_addr;
850137628Smlaier		prefix.s_addr &= mask.s_addr;
851137628Smlaier	}
852137628Smlaier
853181803Sbz	TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link) {
854151555Sglebius		if (rtinitflags(ia)) {
855137628Smlaier			p = ia->ia_addr.sin_addr;
856151555Sglebius
857151555Sglebius			if (prefix.s_addr != p.s_addr)
858151555Sglebius				continue;
859151555Sglebius		} else {
860151555Sglebius			p = ia->ia_addr.sin_addr;
861151555Sglebius			m = ia->ia_sockmask.sin_addr;
862151555Sglebius			p.s_addr &= m.s_addr;
863151555Sglebius
864151555Sglebius			if (prefix.s_addr != p.s_addr ||
865151555Sglebius			    mask.s_addr != m.s_addr)
866151555Sglebius				continue;
867137628Smlaier		}
868137628Smlaier
869137628Smlaier		/*
870137628Smlaier		 * If we got a matching prefix route inserted by other
871137628Smlaier		 * interface address, we are done here.
872137628Smlaier		 */
873149221Sglebius		if (ia->ia_flags & IFA_ROUTE) {
874181803Sbz			if (V_sameprefixcarponly &&
875149221Sglebius			    target->ia_ifp->if_type != IFT_CARP &&
876149221Sglebius			    ia->ia_ifp->if_type != IFT_CARP)
877149221Sglebius				return (EEXIST);
878149221Sglebius			else
879149221Sglebius				return (0);
880149221Sglebius		}
881137628Smlaier	}
882137628Smlaier
883137628Smlaier	/*
884137628Smlaier	 * No-one seem to have this prefix route, so we try to insert it.
885137628Smlaier	 */
886137628Smlaier	error = rtinit(&target->ia_ifa, (int)RTM_ADD, flags);
887137628Smlaier	if (!error)
888137628Smlaier		target->ia_flags |= IFA_ROUTE;
889184295Sbz	return (error);
890137628Smlaier}
891137628Smlaier
892186119Sqingliextern void arp_ifscrub(struct ifnet *ifp, uint32_t addr);
893186119Sqingli
8941541Srgrimes/*
895137628Smlaier * If there is no other address in the system that can serve a route to the
896137628Smlaier * same prefix, remove the route.  Hand over the route to the new address
897137628Smlaier * otherwise.
898137628Smlaier */
899137628Smlaierstatic int
900169454Srwatsonin_scrubprefix(struct in_ifaddr *target)
901137628Smlaier{
902183550Szec	INIT_VNET_INET(curvnet);
903137628Smlaier	struct in_ifaddr *ia;
904137628Smlaier	struct in_addr prefix, mask, p;
905137628Smlaier	int error;
906137628Smlaier
907137628Smlaier	if ((target->ia_flags & IFA_ROUTE) == 0)
908184295Sbz		return (0);
909137628Smlaier
910137628Smlaier	if (rtinitflags(target))
911137628Smlaier		prefix = target->ia_dstaddr.sin_addr;
912137628Smlaier	else {
913137628Smlaier		prefix = target->ia_addr.sin_addr;
914137628Smlaier		mask = target->ia_sockmask.sin_addr;
915137628Smlaier		prefix.s_addr &= mask.s_addr;
916186119Sqingli		/* remove arp cache */
917186119Sqingli		arp_ifscrub(target->ia_ifp, IA_SIN(target)->sin_addr.s_addr);
918137628Smlaier	}
919137628Smlaier
920181803Sbz	TAILQ_FOREACH(ia, &V_in_ifaddrhead, ia_link) {
921137628Smlaier		if (rtinitflags(ia))
922137628Smlaier			p = ia->ia_dstaddr.sin_addr;
923137628Smlaier		else {
924137628Smlaier			p = ia->ia_addr.sin_addr;
925137628Smlaier			p.s_addr &= ia->ia_sockmask.sin_addr.s_addr;
926137628Smlaier		}
927137628Smlaier
928137628Smlaier		if (prefix.s_addr != p.s_addr)
929137628Smlaier			continue;
930137628Smlaier
931137628Smlaier		/*
932137628Smlaier		 * If we got a matching prefix address, move IFA_ROUTE and
933137628Smlaier		 * the route itself to it.  Make sure that routing daemons
934137628Smlaier		 * get a heads-up.
935143868Sglebius		 *
936143868Sglebius		 * XXX: a special case for carp(4) interface
937137628Smlaier		 */
938143868Sglebius		if ((ia->ia_flags & IFA_ROUTE) == 0
939143868Sglebius#ifdef DEV_CARP
940143868Sglebius		    && (ia->ia_ifp->if_type != IFT_CARP)
941143868Sglebius#endif
942143868Sglebius							) {
943137628Smlaier			rtinit(&(target->ia_ifa), (int)RTM_DELETE,
944137628Smlaier			    rtinitflags(target));
945137628Smlaier			target->ia_flags &= ~IFA_ROUTE;
946137628Smlaier
947137628Smlaier			error = rtinit(&ia->ia_ifa, (int)RTM_ADD,
948137628Smlaier			    rtinitflags(ia) | RTF_UP);
949137628Smlaier			if (error == 0)
950137628Smlaier				ia->ia_flags |= IFA_ROUTE;
951184295Sbz			return (error);
952137628Smlaier		}
953137628Smlaier	}
954137628Smlaier
955137628Smlaier	/*
956137628Smlaier	 * As no-one seem to have this prefix, we can remove the route.
957137628Smlaier	 */
958137628Smlaier	rtinit(&(target->ia_ifa), (int)RTM_DELETE, rtinitflags(target));
959137628Smlaier	target->ia_flags &= ~IFA_ROUTE;
960184295Sbz	return (0);
961137628Smlaier}
962137628Smlaier
963137628Smlaier#undef rtinitflags
964137628Smlaier
965137628Smlaier/*
9661541Srgrimes * Return 1 if the address might be a local broadcast address.
9671541Srgrimes */
9681549Srgrimesint
969169454Srwatsonin_broadcast(struct in_addr in, struct ifnet *ifp)
9701541Srgrimes{
9711541Srgrimes	register struct ifaddr *ifa;
9721541Srgrimes	u_long t;
9731541Srgrimes
9741541Srgrimes	if (in.s_addr == INADDR_BROADCAST ||
9751541Srgrimes	    in.s_addr == INADDR_ANY)
976184295Sbz		return (1);
9771541Srgrimes	if ((ifp->if_flags & IFF_BROADCAST) == 0)
978184295Sbz		return (0);
9791541Srgrimes	t = ntohl(in.s_addr);
9801541Srgrimes	/*
9811541Srgrimes	 * Look through the list of addresses for a match
9821541Srgrimes	 * with a broadcast address.
9831541Srgrimes	 */
9841541Srgrimes#define ia ((struct in_ifaddr *)ifa)
98574362Sphk	TAILQ_FOREACH(ifa, &ifp->if_addrhead, ifa_link)
9861541Srgrimes		if (ifa->ifa_addr->sa_family == AF_INET &&
9871541Srgrimes		    (in.s_addr == ia->ia_broadaddr.sin_addr.s_addr ||
9881541Srgrimes		     in.s_addr == ia->ia_netbroadcast.s_addr ||
9891541Srgrimes		     /*
9901541Srgrimes		      * Check for old-style (host 0) broadcast.
9911541Srgrimes		      */
99213351Sguido		     t == ia->ia_subnet || t == ia->ia_net) &&
99313351Sguido		     /*
99413351Sguido		      * Check for an all one subnetmask. These
99513351Sguido		      * only exist when an interface gets a secondary
99613351Sguido		      * address.
99713351Sguido		      */
99813351Sguido		     ia->ia_subnetmask != (u_long)0xffffffff)
999184295Sbz			    return (1);
10001541Srgrimes	return (0);
10011541Srgrimes#undef ia
10021541Srgrimes}
1003167729Sbms
10041541Srgrimes/*
1005189592Sbms * On interface removal, clean up IPv4 data structures hung off of the ifnet.
1006189592Sbms */
1007189592Sbmsvoid
1008189592Sbmsin_ifdetach(struct ifnet *ifp)
1009189592Sbms{
1010189592Sbms	INIT_VNET_INET(ifp->if_vnet);
1011189592Sbms
1012189592Sbms	in_pcbpurgeif0(&V_ripcbinfo, ifp);
1013189592Sbms	in_pcbpurgeif0(&V_udbinfo, ifp);
1014189592Sbms	in_purgemaddrs(ifp);
1015189592Sbms}
1016189592Sbms
1017189592Sbms/*
1018167729Sbms * Delete all IPv4 multicast address records, and associated link-layer
1019167729Sbms * multicast address records, associated with ifp.
1020189592Sbms * XXX It looks like domifdetach runs AFTER the link layer cleanup.
1021162718Sbms */
1022167729Sbmsstatic void
1023167729Sbmsin_purgemaddrs(struct ifnet *ifp)
1024162718Sbms{
1025183550Szec	INIT_VNET_INET(ifp->if_vnet);
1026189592Sbms	LIST_HEAD(,in_multi) purgeinms;
1027189592Sbms	struct in_multi		*inm, *tinm;
1028189592Sbms	struct ifmultiaddr	*ifma;
1029162718Sbms
1030189592Sbms	LIST_INIT(&purgeinms);
1031162718Sbms	IN_MULTI_LOCK();
1032189592Sbms
1033189592Sbms	/*
1034189592Sbms	 * Extract list of in_multi associated with the detaching ifp
1035189592Sbms	 * which the PF_INET layer is about to release.
1036189592Sbms	 * We need to do this as IF_ADDR_LOCK() may be re-acquired
1037189592Sbms	 * by code further down.
1038189592Sbms	 */
1039189592Sbms	IF_ADDR_LOCK(ifp);
1040189592Sbms	TAILQ_FOREACH(ifma, &ifp->if_multiaddrs, ifma_link) {
1041189592Sbms		if (ifma->ifma_addr->sa_family != AF_INET)
1042189592Sbms			continue;
1043189592Sbms		inm = (struct in_multi *)ifma->ifma_protospec;
1044189592Sbms		LIST_INSERT_HEAD(&purgeinms, inm, inm_link);
1045162718Sbms	}
1046189592Sbms	IF_ADDR_UNLOCK(ifp);
1047150296Srwatson
1048189592Sbms	LIST_FOREACH_SAFE(inm, &purgeinms, inm_link, tinm) {
1049189592Sbms		inm_release_locked(inm);
1050189592Sbms		LIST_REMOVE(inm, inm_link);
1051189592Sbms	}
1052189592Sbms	igmp_ifdetach(ifp);
1053150296Srwatson
1054189592Sbms	IN_MULTI_UNLOCK();
1055150296Srwatson}
1056186119Sqingli
1057186119Sqingli#include <sys/syslog.h>
1058186119Sqingli#include <net/if_dl.h>
1059186119Sqingli#include <netinet/if_ether.h>
1060186119Sqingli
1061186119Sqinglistruct in_llentry {
1062186119Sqingli	struct llentry		base;
1063186119Sqingli	struct sockaddr_in	l3_addr4;
1064186119Sqingli};
1065186119Sqingli
1066186119Sqinglistatic struct llentry *
1067186119Sqingliin_lltable_new(const struct sockaddr *l3addr, u_int flags)
1068186119Sqingli{
1069186119Sqingli	struct in_llentry *lle;
1070186119Sqingli
1071186119Sqingli	lle = malloc(sizeof(struct in_llentry), M_LLTABLE, M_DONTWAIT | M_ZERO);
1072186119Sqingli	if (lle == NULL)		/* NB: caller generates msg */
1073186119Sqingli		return NULL;
1074186119Sqingli
1075186119Sqingli	callout_init(&lle->base.la_timer, CALLOUT_MPSAFE);
1076186119Sqingli	/*
1077186119Sqingli	 * For IPv4 this will trigger "arpresolve" to generate
1078186119Sqingli	 * an ARP request.
1079186119Sqingli	 */
1080186119Sqingli	lle->base.la_expire = time_second; /* mark expired */
1081186119Sqingli	lle->l3_addr4 = *(const struct sockaddr_in *)l3addr;
1082186119Sqingli	lle->base.lle_refcnt = 1;
1083186119Sqingli	LLE_LOCK_INIT(&lle->base);
1084186119Sqingli	return &lle->base;
1085186119Sqingli}
1086186119Sqingli
1087186119Sqingli/*
1088186119Sqingli * Deletes an address from the address table.
1089186119Sqingli * This function is called by the timer functions
1090186119Sqingli * such as arptimer() and nd6_llinfo_timer(), and
1091186119Sqingli * the caller does the locking.
1092186119Sqingli */
1093186119Sqinglistatic void
1094186119Sqingliin_lltable_free(struct lltable *llt, struct llentry *lle)
1095186119Sqingli{
1096186150Skmacy	LLE_WUNLOCK(lle);
1097186150Skmacy	LLE_LOCK_DESTROY(lle);
1098186119Sqingli	free(lle, M_LLTABLE);
1099186119Sqingli}
1100186119Sqingli
1101186119Sqinglistatic int
1102186119Sqingliin_lltable_rtcheck(struct ifnet *ifp, const struct sockaddr *l3addr)
1103186119Sqingli{
1104186119Sqingli	struct rtentry *rt;
1105186119Sqingli
1106186119Sqingli	KASSERT(l3addr->sa_family == AF_INET,
1107186119Sqingli	    ("sin_family %d", l3addr->sa_family));
1108186119Sqingli
1109186119Sqingli	/* XXX rtalloc1 should take a const param */
1110186119Sqingli	rt = rtalloc1(__DECONST(struct sockaddr *, l3addr), 0, 0);
1111186119Sqingli	if (rt == NULL || (rt->rt_flags & RTF_GATEWAY) || rt->rt_ifp != ifp) {
1112186119Sqingli		log(LOG_INFO, "IPv4 address: \"%s\" is not on the network\n",
1113186119Sqingli		    inet_ntoa(((const struct sockaddr_in *)l3addr)->sin_addr));
1114186119Sqingli		if (rt != NULL)
1115186119Sqingli			RTFREE_LOCKED(rt);
1116186119Sqingli		return (EINVAL);
1117186119Sqingli	}
1118186119Sqingli	RTFREE_LOCKED(rt);
1119186119Sqingli	return 0;
1120186119Sqingli}
1121186119Sqingli
1122186119Sqingli/*
1123186119Sqingli * Return NULL if not found or marked for deletion.
1124186119Sqingli * If found return lle read locked.
1125186119Sqingli */
1126186119Sqinglistatic struct llentry *
1127186119Sqingliin_lltable_lookup(struct lltable *llt, u_int flags, const struct sockaddr *l3addr)
1128186119Sqingli{
1129186119Sqingli	const struct sockaddr_in *sin = (const struct sockaddr_in *)l3addr;
1130186119Sqingli	struct ifnet *ifp = llt->llt_ifp;
1131186119Sqingli	struct llentry *lle;
1132186119Sqingli	struct llentries *lleh;
1133186119Sqingli	u_int hashkey;
1134186119Sqingli
1135186119Sqingli	IF_AFDATA_LOCK_ASSERT(ifp);
1136186119Sqingli	KASSERT(l3addr->sa_family == AF_INET,
1137186119Sqingli	    ("sin_family %d", l3addr->sa_family));
1138186119Sqingli
1139186119Sqingli	hashkey = sin->sin_addr.s_addr;
1140186119Sqingli	lleh = &llt->lle_head[LLATBL_HASH(hashkey, LLTBL_HASHMASK)];
1141186119Sqingli	LIST_FOREACH(lle, lleh, lle_next) {
1142186708Sqingli		struct sockaddr_in *sa2 = (struct sockaddr_in *)L3_ADDR(lle);
1143186119Sqingli		if (lle->la_flags & LLE_DELETED)
1144186119Sqingli			continue;
1145186708Sqingli		if (sa2->sin_addr.s_addr == sin->sin_addr.s_addr)
1146186119Sqingli			break;
1147186119Sqingli	}
1148186119Sqingli	if (lle == NULL) {
1149186119Sqingli#ifdef DIAGNOSTICS
1150186119Sqingli		if (flags & LLE_DELETE)
1151186119Sqingli			log(LOG_INFO, "interface address is missing from cache = %p  in delete\n", lle);
1152186119Sqingli#endif
1153186119Sqingli		if (!(flags & LLE_CREATE))
1154186119Sqingli			return (NULL);
1155186119Sqingli		/*
1156186119Sqingli		 * A route that covers the given address must have
1157186119Sqingli		 * been installed 1st because we are doing a resolution,
1158186119Sqingli		 * verify this.
1159186119Sqingli		 */
1160186119Sqingli		if (!(flags & LLE_IFADDR) &&
1161186119Sqingli		    in_lltable_rtcheck(ifp, l3addr) != 0)
1162186119Sqingli			goto done;
1163186119Sqingli
1164186119Sqingli		lle = in_lltable_new(l3addr, flags);
1165186119Sqingli		if (lle == NULL) {
1166186119Sqingli			log(LOG_INFO, "lla_lookup: new lle malloc failed\n");
1167186119Sqingli			goto done;
1168186119Sqingli		}
1169186119Sqingli		lle->la_flags = flags & ~LLE_CREATE;
1170186119Sqingli		if ((flags & (LLE_CREATE | LLE_IFADDR)) == (LLE_CREATE | LLE_IFADDR)) {
1171186119Sqingli			bcopy(IF_LLADDR(ifp), &lle->ll_addr, ifp->if_addrlen);
1172186119Sqingli			lle->la_flags |= (LLE_VALID | LLE_STATIC);
1173186119Sqingli		}
1174186119Sqingli
1175186119Sqingli		lle->lle_tbl  = llt;
1176186119Sqingli		lle->lle_head = lleh;
1177186119Sqingli		LIST_INSERT_HEAD(lleh, lle, lle_next);
1178186119Sqingli	} else if (flags & LLE_DELETE) {
1179186119Sqingli		if (!(lle->la_flags & LLE_IFADDR) || (flags & LLE_IFADDR)) {
1180186119Sqingli			LLE_WLOCK(lle);
1181186119Sqingli			lle->la_flags = LLE_DELETED;
1182186119Sqingli			LLE_WUNLOCK(lle);
1183186119Sqingli#ifdef DIAGNOSTICS
1184186119Sqingli			log(LOG_INFO, "ifaddr cache = %p  is deleted\n", lle);
1185186119Sqingli#endif
1186186119Sqingli		}
1187186119Sqingli		lle = (void *)-1;
1188186119Sqingli
1189186119Sqingli	}
1190186544Sbz	if (LLE_IS_VALID(lle)) {
1191186119Sqingli		if (flags & LLE_EXCLUSIVE)
1192186119Sqingli			LLE_WLOCK(lle);
1193186119Sqingli		else
1194186119Sqingli			LLE_RLOCK(lle);
1195186119Sqingli	}
1196186119Sqinglidone:
1197186119Sqingli	return (lle);
1198186119Sqingli}
1199186119Sqingli
1200186119Sqinglistatic int
1201186119Sqingliin_lltable_dump(struct lltable *llt, struct sysctl_req *wr)
1202186119Sqingli{
1203186119Sqingli#define	SIN(lle)	((struct sockaddr_in *) L3_ADDR(lle))
1204186119Sqingli	struct ifnet *ifp = llt->llt_ifp;
1205186119Sqingli	struct llentry *lle;
1206186119Sqingli	/* XXX stack use */
1207186119Sqingli	struct {
1208186119Sqingli		struct rt_msghdr	rtm;
1209186119Sqingli		struct sockaddr_inarp	sin;
1210186119Sqingli		struct sockaddr_dl	sdl;
1211186119Sqingli	} arpc;
1212186119Sqingli	int error, i;
1213186119Sqingli
1214186119Sqingli	/* XXXXX
1215186119Sqingli	 * current IFNET_RLOCK() is mapped to IFNET_WLOCK()
1216186119Sqingli	 * so it is okay to use this ASSERT, change it when
1217186119Sqingli	 * IFNET lock is finalized
1218186119Sqingli	 */
1219186119Sqingli	IFNET_WLOCK_ASSERT();
1220186119Sqingli
1221186119Sqingli	error = 0;
1222186119Sqingli	for (i = 0; i < LLTBL_HASHTBL_SIZE; i++) {
1223186119Sqingli		LIST_FOREACH(lle, &llt->lle_head[i], lle_next) {
1224186119Sqingli			struct sockaddr_dl *sdl;
1225186119Sqingli
1226186119Sqingli			/* skip deleted entries */
1227186119Sqingli			if ((lle->la_flags & (LLE_DELETED|LLE_VALID)) != LLE_VALID)
1228186119Sqingli				continue;
1229186980Sbz			/* Skip if jailed and not a valid IP of the prison. */
1230188144Sjamie			if (prison_if(wr->td->td_ucred, L3_ADDR(lle)) != 0)
1231186980Sbz				continue;
1232186119Sqingli			/*
1233186119Sqingli			 * produce a msg made of:
1234186119Sqingli			 *  struct rt_msghdr;
1235186119Sqingli			 *  struct sockaddr_inarp; (IPv4)
1236186119Sqingli			 *  struct sockaddr_dl;
1237186119Sqingli			 */
1238186119Sqingli			bzero(&arpc, sizeof(arpc));
1239186119Sqingli			arpc.rtm.rtm_msglen = sizeof(arpc);
1240186935Sharti			arpc.rtm.rtm_version = RTM_VERSION;
1241186935Sharti			arpc.rtm.rtm_type = RTM_GET;
1242186935Sharti			arpc.rtm.rtm_flags = RTF_UP;
1243186935Sharti			arpc.rtm.rtm_addrs = RTA_DST | RTA_GATEWAY;
1244186119Sqingli			arpc.sin.sin_family = AF_INET;
1245186119Sqingli			arpc.sin.sin_len = sizeof(arpc.sin);
1246186119Sqingli			arpc.sin.sin_addr.s_addr = SIN(lle)->sin_addr.s_addr;
1247186119Sqingli
1248186119Sqingli			/* publish */
1249186119Sqingli			if (lle->la_flags & LLE_PUB) {
1250186119Sqingli				arpc.rtm.rtm_flags |= RTF_ANNOUNCE;
1251186119Sqingli				/* proxy only */
1252186119Sqingli				if (lle->la_flags & LLE_PROXY)
1253186119Sqingli					arpc.sin.sin_other = SIN_PROXY;
1254186119Sqingli			}
1255186119Sqingli
1256186119Sqingli			sdl = &arpc.sdl;
1257186119Sqingli			sdl->sdl_family = AF_LINK;
1258186119Sqingli			sdl->sdl_len = sizeof(*sdl);
1259186119Sqingli			sdl->sdl_alen = ifp->if_addrlen;
1260186119Sqingli			sdl->sdl_index = ifp->if_index;
1261186119Sqingli			sdl->sdl_type = ifp->if_type;
1262186119Sqingli			bcopy(&lle->ll_addr, LLADDR(sdl), ifp->if_addrlen);
1263186119Sqingli
1264186119Sqingli			arpc.rtm.rtm_rmx.rmx_expire =
1265186119Sqingli			    lle->la_flags & LLE_STATIC ? 0 : lle->la_expire;
1266186500Sqingli			arpc.rtm.rtm_flags |= (RTF_HOST | RTF_LLDATA);
1267186119Sqingli			if (lle->la_flags & LLE_STATIC)
1268186119Sqingli				arpc.rtm.rtm_flags |= RTF_STATIC;
1269186119Sqingli			arpc.rtm.rtm_index = ifp->if_index;
1270186119Sqingli			error = SYSCTL_OUT(wr, &arpc, sizeof(arpc));
1271186119Sqingli			if (error)
1272186119Sqingli				break;
1273186119Sqingli		}
1274186119Sqingli	}
1275186119Sqingli	return error;
1276186119Sqingli#undef SIN
1277186119Sqingli}
1278186119Sqingli
1279186119Sqinglivoid *
1280186119Sqingliin_domifattach(struct ifnet *ifp)
1281189592Sbms{
1282189592Sbms	struct in_ifinfo *ii;
1283189592Sbms	struct lltable *llt;
1284189592Sbms
1285189592Sbms	ii = malloc(sizeof(struct in_ifinfo), M_IFADDR, M_WAITOK|M_ZERO);
1286189592Sbms
1287189592Sbms	llt = lltable_init(ifp, AF_INET);
1288186119Sqingli	if (llt != NULL) {
1289186119Sqingli		llt->llt_new = in_lltable_new;
1290186119Sqingli		llt->llt_free = in_lltable_free;
1291186119Sqingli		llt->llt_rtcheck = in_lltable_rtcheck;
1292186119Sqingli		llt->llt_lookup = in_lltable_lookup;
1293186119Sqingli		llt->llt_dump = in_lltable_dump;
1294186119Sqingli	}
1295189592Sbms	ii->ii_llt = llt;
1296189592Sbms
1297189592Sbms	ii->ii_igmp = igmp_domifattach(ifp);
1298189592Sbms
1299189592Sbms	return ii;
1300186119Sqingli}
1301186119Sqingli
1302186119Sqinglivoid
1303189592Sbmsin_domifdetach(struct ifnet *ifp, void *aux)
1304186119Sqingli{
1305189592Sbms	struct in_ifinfo *ii = (struct in_ifinfo *)aux;
1306186119Sqingli
1307189592Sbms	igmp_domifdetach(ifp);
1308189592Sbms	lltable_free(ii->ii_llt);
1309189592Sbms	free(ii, M_IFADDR);
1310186119Sqingli}
1311