xref: /freebsd/sys/net/if_ethersubr.c (revision c69aeaad)
1c398230bSWarner Losh /*-
2df8bae1dSRodney W. Grimes  * Copyright (c) 1982, 1989, 1993
3df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
4df8bae1dSRodney W. Grimes  *
5df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
6df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
7df8bae1dSRodney W. Grimes  * are met:
8df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
9df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
10df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
12df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
13df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
14df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
15df8bae1dSRodney W. Grimes  *    without specific prior written permission.
16df8bae1dSRodney W. Grimes  *
17df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
18df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
21df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
28df8bae1dSRodney W. Grimes  *
29df8bae1dSRodney W. Grimes  *	@(#)if_ethersubr.c	8.1 (Berkeley) 6/10/93
30c3aac50fSPeter Wemm  * $FreeBSD$
31df8bae1dSRodney W. Grimes  */
32df8bae1dSRodney W. Grimes 
331d5e9e22SEivind Eklund #include "opt_inet.h"
34cfa1ca9dSYoshinobu Inoue #include "opt_inet6.h"
354cf49a43SJulian Elischer #include "opt_netgraph.h"
366eeac1d9SJulian Elischer #include "opt_mbuf_profiling.h"
377527624eSRobert Watson #include "opt_rss.h"
38430df5f4SEivind Eklund 
39df8bae1dSRodney W. Grimes #include <sys/param.h>
40df8bae1dSRodney W. Grimes #include <sys/systm.h>
41df8bae1dSRodney W. Grimes #include <sys/kernel.h>
42385195c0SMarko Zec #include <sys/lock.h>
43df8bae1dSRodney W. Grimes #include <sys/malloc.h>
4441ee9f1cSPoul-Henning Kamp #include <sys/module.h>
45df8bae1dSRodney W. Grimes #include <sys/mbuf.h>
4610b1fde0SMark Murray #include <sys/random.h>
47df8bae1dSRodney W. Grimes #include <sys/socket.h>
4851a53488SBruce Evans #include <sys/sockio.h>
49602d513cSGarrett Wollman #include <sys/sysctl.h>
50ef1f9169SMarcel Moolenaar #include <sys/uuid.h>
51df8bae1dSRodney W. Grimes 
52df8bae1dSRodney W. Grimes #include <net/if.h>
5376039bc8SGleb Smirnoff #include <net/if_var.h>
54d7647d96SDag-Erling Smørgrav #include <net/if_arp.h>
55df8bae1dSRodney W. Grimes #include <net/netisr.h>
56df8bae1dSRodney W. Grimes #include <net/route.h>
57df8bae1dSRodney W. Grimes #include <net/if_llc.h>
58df8bae1dSRodney W. Grimes #include <net/if_dl.h>
59df8bae1dSRodney W. Grimes #include <net/if_types.h>
602e2de7f2SArchie Cobbs #include <net/bpf.h>
61e1e1452dSArchie Cobbs #include <net/ethernet.h>
62fd6238a6SAndrew Thompson #include <net/if_bridgevar.h>
63c1d93b05SSam Leffler #include <net/if_vlan_var.h>
646e6b3f7cSQing Li #include <net/if_llatbl.h>
657d4317bdSAlexander V. Chernikov #include <net/pfil.h>
664b79449eSBjoern A. Zeeb #include <net/vnet.h>
67df8bae1dSRodney W. Grimes 
6875bf2db3SGleb Smirnoff #include <netpfil/pf/pf_mtag.h>
6975bf2db3SGleb Smirnoff 
7082cd038dSYoshinobu Inoue #if defined(INET) || defined(INET6)
71df8bae1dSRodney W. Grimes #include <netinet/in.h>
72df8bae1dSRodney W. Grimes #include <netinet/in_var.h>
73df8bae1dSRodney W. Grimes #include <netinet/if_ether.h>
747527624eSRobert Watson #include <netinet/in_rss.h>
7554bfbd51SWill Andrews #include <netinet/ip_carp.h>
760bcfa8e4SLuigi Rizzo #include <netinet/ip_var.h>
771d5e9e22SEivind Eklund #endif
7882cd038dSYoshinobu Inoue #ifdef INET6
7982cd038dSYoshinobu Inoue #include <netinet6/nd6.h>
8082cd038dSYoshinobu Inoue #endif
81aed55708SRobert Watson #include <security/mac/mac_framework.h>
82aed55708SRobert Watson 
83d54d93acSEd Maste #ifdef CTASSERT
84d54d93acSEd Maste CTASSERT(sizeof (struct ether_header) == ETHER_ADDR_LEN * 2 + 2);
85d54d93acSEd Maste CTASSERT(sizeof (struct ether_addr) == ETHER_ADDR_LEN);
86d54d93acSEd Maste #endif
87d54d93acSEd Maste 
887d4317bdSAlexander V. Chernikov VNET_DEFINE(struct pfil_head, link_pfil_hook);	/* Packet filter hooks */
897d4317bdSAlexander V. Chernikov 
90e1e1452dSArchie Cobbs /* netgraph node hooks for ng_ether(4) */
91c1d93b05SSam Leffler void	(*ng_ether_input_p)(struct ifnet *ifp, struct mbuf **mp);
92c1d93b05SSam Leffler void	(*ng_ether_input_orphan_p)(struct ifnet *ifp, struct mbuf *m);
93e1e1452dSArchie Cobbs int	(*ng_ether_output_p)(struct ifnet *ifp, struct mbuf **mp);
94e1e1452dSArchie Cobbs void	(*ng_ether_attach_p)(struct ifnet *ifp);
95e1e1452dSArchie Cobbs void	(*ng_ether_detach_p)(struct ifnet *ifp);
96e1e1452dSArchie Cobbs 
97824eb9dcSDavid E. O'Brien void	(*vlan_input_p)(struct ifnet *, struct mbuf *);
989d4fe4b2SBrooks Davis 
99fd6238a6SAndrew Thompson /* if_bridge(4) support */
1008f867517SAndrew Thompson struct mbuf *(*bridge_input_p)(struct ifnet *, struct mbuf *);
1018f867517SAndrew Thompson int	(*bridge_output_p)(struct ifnet *, struct mbuf *,
1028f867517SAndrew Thompson 		struct sockaddr *, struct rtentry *);
103c8b01292SAndrew Thompson void	(*bridge_dn_p)(struct mbuf *, struct ifnet *);
1048f867517SAndrew Thompson 
10518242d3bSAndrew Thompson /* if_lagg(4) support */
10618242d3bSAndrew Thompson struct mbuf *(*lagg_input_p)(struct ifnet *, struct mbuf *);
107b47888ceSAndrew Thompson 
108e589108dSRobert Watson static const u_char etherbroadcastaddr[ETHER_ADDR_LEN] =
109868d8b62SMatthew N. Dodd 			{ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff };
110868d8b62SMatthew N. Dodd 
111929ddbbbSAlfred Perlstein static	int ether_resolvemulti(struct ifnet *, struct sockaddr **,
112929ddbbbSAlfred Perlstein 		struct sockaddr *);
113d3c351c5SMarko Zec #ifdef VIMAGE
114d3c351c5SMarko Zec static	void ether_reassign(struct ifnet *, struct vnet *, char *);
115d3c351c5SMarko Zec #endif
116868d8b62SMatthew N. Dodd 
11769462a82SBruce M Simpson #define	ETHER_IS_BROADCAST(addr) \
11869462a82SBruce M Simpson 	(bcmp(etherbroadcastaddr, (addr), ETHER_ADDR_LEN) == 0)
11969462a82SBruce M Simpson 
1204c8e8c05SJulian Elischer #define senderr(e) do { error = (e); goto bad;} while (0)
121df8bae1dSRodney W. Grimes 
12222f8ce43SAlexander V. Chernikov static void
12322f8ce43SAlexander V. Chernikov update_mbuf_csumflags(struct mbuf *src, struct mbuf *dst)
12422f8ce43SAlexander V. Chernikov {
12522f8ce43SAlexander V. Chernikov 	int csum_flags = 0;
12622f8ce43SAlexander V. Chernikov 
12722f8ce43SAlexander V. Chernikov 	if (src->m_pkthdr.csum_flags & CSUM_IP)
12822f8ce43SAlexander V. Chernikov 		csum_flags |= (CSUM_IP_CHECKED|CSUM_IP_VALID);
12922f8ce43SAlexander V. Chernikov 	if (src->m_pkthdr.csum_flags & CSUM_DELAY_DATA)
13022f8ce43SAlexander V. Chernikov 		csum_flags |= (CSUM_DATA_VALID|CSUM_PSEUDO_HDR);
13122f8ce43SAlexander V. Chernikov 	if (src->m_pkthdr.csum_flags & CSUM_SCTP)
13222f8ce43SAlexander V. Chernikov 		csum_flags |= CSUM_SCTP_VALID;
13322f8ce43SAlexander V. Chernikov 	dst->m_pkthdr.csum_flags |= csum_flags;
13422f8ce43SAlexander V. Chernikov 	if (csum_flags & CSUM_DATA_VALID)
13522f8ce43SAlexander V. Chernikov 		dst->m_pkthdr.csum_data = 0xffff;
13622f8ce43SAlexander V. Chernikov }
13722f8ce43SAlexander V. Chernikov 
138df8bae1dSRodney W. Grimes /*
139df8bae1dSRodney W. Grimes  * Ethernet output routine.
140df8bae1dSRodney W. Grimes  * Encapsulate a packet of type family for the local net.
141df8bae1dSRodney W. Grimes  * Use trailer local net encapsulation if enough data in first
142df8bae1dSRodney W. Grimes  * packet leaves a multiple of 512 bytes of data in remainder.
143df8bae1dSRodney W. Grimes  */
144df8bae1dSRodney W. Grimes int
14572fd1b6aSDag-Erling Smørgrav ether_output(struct ifnet *ifp, struct mbuf *m,
14647e8d432SGleb Smirnoff 	const struct sockaddr *dst, struct route *ro)
147df8bae1dSRodney W. Grimes {
148df8bae1dSRodney W. Grimes 	short type;
149279aa3d4SKip Macy 	int error = 0, hdrcmplt = 0;
150c69aeaadSAlexander V. Chernikov 	u_char edst[ETHER_ADDR_LEN];
1516e6b3f7cSQing Li 	struct llentry *lle = NULL;
152279aa3d4SKip Macy 	struct rtentry *rt0 = NULL;
153098a8c3bSMatthew N. Dodd 	struct ether_header *eh;
15460ee3847SMax Laier 	struct pf_mtag *t;
155c54c76ccSOleg Bulyzhin 	int loop_copy = 1;
156d32864c3SRobert Watson 	int hlen;	/* link layer header length */
157df8bae1dSRodney W. Grimes 
158279aa3d4SKip Macy 	if (ro != NULL) {
1599fca4f79SQing Li 		if (!(m->m_flags & (M_BCAST | M_MCAST)))
160279aa3d4SKip Macy 			lle = ro->ro_lle;
161279aa3d4SKip Macy 		rt0 = ro->ro_rt;
162279aa3d4SKip Macy 	}
16343b29369SRobert Watson #ifdef MAC
16430d239bcSRobert Watson 	error = mac_ifnet_check_transmit(ifp, m);
16543b29369SRobert Watson 	if (error)
16643b29369SRobert Watson 		senderr(error);
16743b29369SRobert Watson #endif
16843b29369SRobert Watson 
1696eeac1d9SJulian Elischer 	M_PROFILE(m);
170afbe3a0fSPoul-Henning Kamp 	if (ifp->if_flags & IFF_MONITOR)
171afbe3a0fSPoul-Henning Kamp 		senderr(ENETDOWN);
17213f4c340SRobert Watson 	if (!((ifp->if_flags & IFF_UP) &&
17313f4c340SRobert Watson 	    (ifp->if_drv_flags & IFF_DRV_RUNNING)))
174df8bae1dSRodney W. Grimes 		senderr(ENETDOWN);
1757f760c48SMatthew N. Dodd 
17684dd0fd0SJulian Elischer 	hlen = ETHER_HDR_LEN;
177df8bae1dSRodney W. Grimes 	switch (dst->sa_family) {
178df8bae1dSRodney W. Grimes #ifdef INET
179df8bae1dSRodney W. Grimes 	case AF_INET:
180279aa3d4SKip Macy 		if (lle != NULL && (lle->la_flags & LLE_VALID))
181279aa3d4SKip Macy 			memcpy(edst, &lle->ll_addr.mac16, sizeof(edst));
182279aa3d4SKip Macy 		else
1836e6b3f7cSQing Li 			error = arpresolve(ifp, rt0, m, dst, edst, &lle);
184cd46a114SLuigi Rizzo 		if (error)
185cd46a114SLuigi Rizzo 			return (error == EWOULDBLOCK ? 0 : error);
18634bed8b0SDavid Greenman 		type = htons(ETHERTYPE_IP);
187df8bae1dSRodney W. Grimes 		break;
18843a6c75aSMatthew N. Dodd 	case AF_ARP:
18943a6c75aSMatthew N. Dodd 	{
19043a6c75aSMatthew N. Dodd 		struct arphdr *ah;
19143a6c75aSMatthew N. Dodd 		ah = mtod(m, struct arphdr *);
19243a6c75aSMatthew N. Dodd 		ah->ar_hrd = htons(ARPHRD_ETHER);
19343a6c75aSMatthew N. Dodd 
194c54c76ccSOleg Bulyzhin 		loop_copy = 0; /* if this is for us, don't do it */
19543a6c75aSMatthew N. Dodd 
19643a6c75aSMatthew N. Dodd 		switch(ntohs(ah->ar_op)) {
19743a6c75aSMatthew N. Dodd 		case ARPOP_REVREQUEST:
19843a6c75aSMatthew N. Dodd 		case ARPOP_REVREPLY:
19943a6c75aSMatthew N. Dodd 			type = htons(ETHERTYPE_REVARP);
20043a6c75aSMatthew N. Dodd 			break;
20143a6c75aSMatthew N. Dodd 		case ARPOP_REQUEST:
20243a6c75aSMatthew N. Dodd 		case ARPOP_REPLY:
20343a6c75aSMatthew N. Dodd 		default:
20443a6c75aSMatthew N. Dodd 			type = htons(ETHERTYPE_ARP);
20543a6c75aSMatthew N. Dodd 			break;
20643a6c75aSMatthew N. Dodd 		}
20743a6c75aSMatthew N. Dodd 
20843a6c75aSMatthew N. Dodd 		if (m->m_flags & M_BCAST)
20943a6c75aSMatthew N. Dodd 			bcopy(ifp->if_broadcastaddr, edst, ETHER_ADDR_LEN);
21043a6c75aSMatthew N. Dodd 		else
21143a6c75aSMatthew N. Dodd 			bcopy(ar_tha(ah), edst, ETHER_ADDR_LEN);
21243a6c75aSMatthew N. Dodd 
21343a6c75aSMatthew N. Dodd 	}
21443a6c75aSMatthew N. Dodd 	break;
215df8bae1dSRodney W. Grimes #endif
21682cd038dSYoshinobu Inoue #ifdef INET6
21782cd038dSYoshinobu Inoue 	case AF_INET6:
218279aa3d4SKip Macy 		if (lle != NULL && (lle->la_flags & LLE_VALID))
219279aa3d4SKip Macy 			memcpy(edst, &lle->ll_addr.mac16, sizeof(edst));
220279aa3d4SKip Macy 		else
2219928dafbSQing Li 			error = nd6_storelladdr(ifp, m, dst, (u_char *)edst, &lle);
222cd46a114SLuigi Rizzo 		if (error)
223cd46a114SLuigi Rizzo 			return error;
22482cd038dSYoshinobu Inoue 		type = htons(ETHERTYPE_IPV6);
22582cd038dSYoshinobu Inoue 		break;
22682cd038dSYoshinobu Inoue #endif
227114ae644SMike Smith 	case pseudo_AF_HDRCMPLT:
22847e8d432SGleb Smirnoff 	    {
229114ae644SMike Smith 		hdrcmplt = 1;
230114ae644SMike Smith 		/* FALLTHROUGH */
231114ae644SMike Smith 
232df8bae1dSRodney W. Grimes 	case AF_UNSPEC:
233c54c76ccSOleg Bulyzhin 		loop_copy = 0; /* if this is for us, don't do it */
234c69aeaadSAlexander V. Chernikov 		eh = (struct ether_header *)dst->sa_data;
23594a5d9b6SDavid Greenman 		(void)memcpy(edst, eh->ether_dhost, sizeof (edst));
236df8bae1dSRodney W. Grimes 		type = eh->ether_type;
237df8bae1dSRodney W. Grimes 		break;
23847e8d432SGleb Smirnoff             }
239df8bae1dSRodney W. Grimes 	default:
24029e1b85fSBrooks Davis 		if_printf(ifp, "can't handle af%d\n", dst->sa_family);
241df8bae1dSRodney W. Grimes 		senderr(EAFNOSUPPORT);
242df8bae1dSRodney W. Grimes 	}
243df8bae1dSRodney W. Grimes 
2446e6b3f7cSQing Li 	if (lle != NULL && (lle->la_flags & LLE_IFADDR)) {
24522f8ce43SAlexander V. Chernikov 		update_mbuf_csumflags(m, m);
2466e6b3f7cSQing Li 		return (if_simloop(ifp, m, dst->sa_family, 0));
2476e6b3f7cSQing Li 	}
2486e6b3f7cSQing Li 
249df8bae1dSRodney W. Grimes 	/*
250df8bae1dSRodney W. Grimes 	 * Add local net header.  If no space in first mbuf,
251df8bae1dSRodney W. Grimes 	 * allocate another.
252df8bae1dSRodney W. Grimes 	 */
253eb1b1807SGleb Smirnoff 	M_PREPEND(m, ETHER_HDR_LEN, M_NOWAIT);
2542166ffe8SRobert Watson 	if (m == NULL)
255df8bae1dSRodney W. Grimes 		senderr(ENOBUFS);
256df8bae1dSRodney W. Grimes 	eh = mtod(m, struct ether_header *);
257c69aeaadSAlexander V. Chernikov 	if (hdrcmplt == 0) {
258c69aeaadSAlexander V. Chernikov 		memcpy(&eh->ether_type, &type, sizeof(eh->ether_type));
259c69aeaadSAlexander V. Chernikov 		memcpy(eh->ether_dhost, edst, sizeof (edst));
260c69aeaadSAlexander V. Chernikov 		memcpy(eh->ether_shost, IF_LLADDR(ifp),sizeof(eh->ether_shost));
261c69aeaadSAlexander V. Chernikov 	}
262ed7509acSJulian Elischer 
263ed7509acSJulian Elischer 	/*
264ed7509acSJulian Elischer 	 * If a simplex interface, and the packet is being sent to our
265ed7509acSJulian Elischer 	 * Ethernet address or a broadcast address, loopback a copy.
266ed7509acSJulian Elischer 	 * XXX To make a simplex device behave exactly like a duplex
267ed7509acSJulian Elischer 	 * device, we should copy in the case of sending to our own
268ed7509acSJulian Elischer 	 * ethernet address (thus letting the original actually appear
269ed7509acSJulian Elischer 	 * on the wire). However, we don't do that here for security
270ed7509acSJulian Elischer 	 * reasons and compatibility with the original behavior.
271ed7509acSJulian Elischer 	 */
272c54c76ccSOleg Bulyzhin 	if ((ifp->if_flags & IFF_SIMPLEX) && loop_copy &&
27360ee3847SMax Laier 	    ((t = pf_find_mtag(m)) == NULL || !t->routed)) {
274c54c76ccSOleg Bulyzhin 		if (m->m_flags & M_BCAST) {
27506f684b0SMatthew N. Dodd 			struct mbuf *n;
276ed7509acSJulian Elischer 
277294dd290SLuigi Rizzo 			/*
278294dd290SLuigi Rizzo 			 * Because if_simloop() modifies the packet, we need a
279294dd290SLuigi Rizzo 			 * writable copy through m_dup() instead of a readonly
280294dd290SLuigi Rizzo 			 * one as m_copy[m] would give us. The alternative would
281294dd290SLuigi Rizzo 			 * be to modify if_simloop() to handle the readonly mbuf,
282294dd290SLuigi Rizzo 			 * but performancewise it is mostly equivalent (trading
283294dd290SLuigi Rizzo 			 * extra data copying vs. extra locking).
2849983b3c0SYaroslav Tykhiy 			 *
2859983b3c0SYaroslav Tykhiy 			 * XXX This is a local workaround.  A number of less
2869983b3c0SYaroslav Tykhiy 			 * often used kernel parts suffer from the same bug.
2879983b3c0SYaroslav Tykhiy 			 * See PR kern/105943 for a proposed general solution.
288294dd290SLuigi Rizzo 			 */
289eb1b1807SGleb Smirnoff 			if ((n = m_dup(m, M_NOWAIT)) != NULL) {
29022f8ce43SAlexander V. Chernikov 				update_mbuf_csumflags(m, n);
29106a429a3SArchie Cobbs 				(void)if_simloop(ifp, n, dst->sa_family, hlen);
292c1404dc0SArchie Cobbs 			} else
2933751dddbSGleb Smirnoff 				if_inc_counter(ifp, IFCOUNTER_IQDROPS, 1);
29406f684b0SMatthew N. Dodd 		} else if (bcmp(eh->ether_dhost, eh->ether_shost,
29506f684b0SMatthew N. Dodd 				ETHER_ADDR_LEN) == 0) {
29622f8ce43SAlexander V. Chernikov 			update_mbuf_csumflags(m, m);
29706a429a3SArchie Cobbs 			(void) if_simloop(ifp, m, dst->sa_family, hlen);
298ed7509acSJulian Elischer 			return (0);	/* XXX */
299ed7509acSJulian Elischer 		}
300ed7509acSJulian Elischer 	}
3012e2de7f2SArchie Cobbs 
3023f7d1396SAndrew Thompson        /*
3033f7d1396SAndrew Thompson 	* Bridges require special output handling.
3043f7d1396SAndrew Thompson 	*/
3053f7d1396SAndrew Thompson 	if (ifp->if_bridge) {
3063f7d1396SAndrew Thompson 		BRIDGE_OUTPUT(ifp, m, error);
3073f7d1396SAndrew Thompson 		return (error);
3083f7d1396SAndrew Thompson 	}
3093f7d1396SAndrew Thompson 
310259d2d54SBjoern A. Zeeb #if defined(INET) || defined(INET6)
311a9771948SGleb Smirnoff 	if (ifp->if_carp &&
31208b68b0eSGleb Smirnoff 	    (error = (*carp_output_p)(ifp, m, dst)))
313a9771948SGleb Smirnoff 		goto bad;
314a9771948SGleb Smirnoff #endif
315a9771948SGleb Smirnoff 
316e1e1452dSArchie Cobbs 	/* Handle ng_ether(4) processing, if any */
317833e8dc5SGleb Smirnoff 	if (ifp->if_l2com != NULL) {
318514bcb89SPoul-Henning Kamp 		KASSERT(ng_ether_output_p != NULL,
319514bcb89SPoul-Henning Kamp 		    ("ng_ether_output_p is NULL"));
320e1e1452dSArchie Cobbs 		if ((error = (*ng_ether_output_p)(ifp, &m)) != 0) {
321e1e1452dSArchie Cobbs bad:			if (m != NULL)
322e1e1452dSArchie Cobbs 				m_freem(m);
323e1e1452dSArchie Cobbs 			return (error);
324e1e1452dSArchie Cobbs 		}
325e1e1452dSArchie Cobbs 		if (m == NULL)
326e1e1452dSArchie Cobbs 			return (0);
327e1e1452dSArchie Cobbs 	}
328e1e1452dSArchie Cobbs 
329e1e1452dSArchie Cobbs 	/* Continue with link-layer output */
330e1e1452dSArchie Cobbs 	return ether_output_frame(ifp, m);
331e1e1452dSArchie Cobbs }
332e1e1452dSArchie Cobbs 
333e1e1452dSArchie Cobbs /*
334e1e1452dSArchie Cobbs  * Ethernet link layer output routine to send a raw frame to the device.
335e1e1452dSArchie Cobbs  *
336e1e1452dSArchie Cobbs  * This assumes that the 14 byte Ethernet header is present and contiguous
337e1e1452dSArchie Cobbs  * in the first mbuf (if BRIDGE'ing).
338e1e1452dSArchie Cobbs  */
339e1e1452dSArchie Cobbs int
340c1d93b05SSam Leffler ether_output_frame(struct ifnet *ifp, struct mbuf *m)
341e1e1452dSArchie Cobbs {
3427d4317bdSAlexander V. Chernikov 	int i;
3432b25acc1SLuigi Rizzo 
3447d4317bdSAlexander V. Chernikov 	if (PFIL_HOOKED(&V_link_pfil_hook)) {
3457d4317bdSAlexander V. Chernikov 		i = pfil_run_hooks(&V_link_pfil_hook, &m, ifp, PFIL_OUT, NULL);
3467d4317bdSAlexander V. Chernikov 
3477d4317bdSAlexander V. Chernikov 		if (i != 0)
3487d4317bdSAlexander V. Chernikov 			return (EACCES);
3497d4317bdSAlexander V. Chernikov 
3507d4317bdSAlexander V. Chernikov 		if (m == NULL)
3517d4317bdSAlexander V. Chernikov 			return (0);
3524b984093SLuigi Rizzo 	}
3532b25acc1SLuigi Rizzo 
354df8bae1dSRodney W. Grimes 	/*
355df5e1987SJonathan Lemon 	 * Queue message on interface, update output statistics if
356df5e1987SJonathan Lemon 	 * successful, and start output if interface not yet active.
357df8bae1dSRodney W. Grimes 	 */
358aea78d20SKip Macy 	return ((ifp->if_transmit)(ifp, m));
359df8bae1dSRodney W. Grimes }
360df8bae1dSRodney W. Grimes 
361d7647d96SDag-Erling Smørgrav #if defined(INET) || defined(INET6)
362d7647d96SDag-Erling Smørgrav #endif
3634b984093SLuigi Rizzo 
3644b984093SLuigi Rizzo /*
365c1d93b05SSam Leffler  * Process a received Ethernet packet; the packet is in the
366c1d93b05SSam Leffler  * mbuf chain m with the ethernet header at the front.
367df8bae1dSRodney W. Grimes  */
368c1d93b05SSam Leffler static void
3696cb52192SRobert Watson ether_input_internal(struct ifnet *ifp, struct mbuf *m)
370df8bae1dSRodney W. Grimes {
371c1d93b05SSam Leffler 	struct ether_header *eh;
372c1d93b05SSam Leffler 	u_short etype;
373df8bae1dSRodney W. Grimes 
37469462a82SBruce M Simpson 	if ((ifp->if_flags & IFF_UP) == 0) {
37569462a82SBruce M Simpson 		m_freem(m);
37669462a82SBruce M Simpson 		return;
37769462a82SBruce M Simpson 	}
37869462a82SBruce M Simpson #ifdef DIAGNOSTIC
37969462a82SBruce M Simpson 	if ((ifp->if_drv_flags & IFF_DRV_RUNNING) == 0) {
38069462a82SBruce M Simpson 		if_printf(ifp, "discard frame at !IFF_DRV_RUNNING\n");
38169462a82SBruce M Simpson 		m_freem(m);
38269462a82SBruce M Simpson 		return;
38369462a82SBruce M Simpson 	}
38469462a82SBruce M Simpson #endif
385c1d93b05SSam Leffler 	/*
386c1d93b05SSam Leffler 	 * Do consistency checks to verify assumptions
387c1d93b05SSam Leffler 	 * made by code past this point.
388c1d93b05SSam Leffler 	 */
389c1d93b05SSam Leffler 	if ((m->m_flags & M_PKTHDR) == 0) {
390c1d93b05SSam Leffler 		if_printf(ifp, "discard frame w/o packet header\n");
3913751dddbSGleb Smirnoff 		if_inc_counter(ifp, IFCOUNTER_IERRORS, 1);
392c939f1aeSLuigi Rizzo 		m_freem(m);
393c939f1aeSLuigi Rizzo 		return;
394c939f1aeSLuigi Rizzo 	}
395797f247bSMatthew N. Dodd 	if (m->m_len < ETHER_HDR_LEN) {
396c1d93b05SSam Leffler 		/* XXX maybe should pullup? */
397c1d93b05SSam Leffler 		if_printf(ifp, "discard frame w/o leading ethernet "
398c1d93b05SSam Leffler 				"header (len %u pkt len %u)\n",
399c1d93b05SSam Leffler 				m->m_len, m->m_pkthdr.len);
4003751dddbSGleb Smirnoff 		if_inc_counter(ifp, IFCOUNTER_IERRORS, 1);
401c1d93b05SSam Leffler 		m_freem(m);
402c1d93b05SSam Leffler 		return;
4032e2de7f2SArchie Cobbs 	}
404c1d93b05SSam Leffler 	eh = mtod(m, struct ether_header *);
405c1d93b05SSam Leffler 	etype = ntohs(eh->ether_type);
406c1d93b05SSam Leffler 	if (m->m_pkthdr.rcvif == NULL) {
407c1d93b05SSam Leffler 		if_printf(ifp, "discard frame w/o interface pointer\n");
4083751dddbSGleb Smirnoff 		if_inc_counter(ifp, IFCOUNTER_IERRORS, 1);
409c1d93b05SSam Leffler 		m_freem(m);
410c1d93b05SSam Leffler 		return;
411c1d93b05SSam Leffler 	}
412c1d93b05SSam Leffler #ifdef DIAGNOSTIC
413c1d93b05SSam Leffler 	if (m->m_pkthdr.rcvif != ifp) {
4149bf40edeSBrooks Davis 		if_printf(ifp, "Warning, frame marked as received on %s\n",
4159bf40edeSBrooks Davis 			m->m_pkthdr.rcvif->if_xname);
416c1d93b05SSam Leffler 	}
417c1d93b05SSam Leffler #endif
418c1d93b05SSam Leffler 
41921ca7b57SMarko Zec 	CURVNET_SET_QUIET(ifp->if_vnet);
42021ca7b57SMarko Zec 
42169462a82SBruce M Simpson 	if (ETHER_IS_MULTICAST(eh->ether_dhost)) {
42269462a82SBruce M Simpson 		if (ETHER_IS_BROADCAST(eh->ether_dhost))
42369462a82SBruce M Simpson 			m->m_flags |= M_BCAST;
42469462a82SBruce M Simpson 		else
42569462a82SBruce M Simpson 			m->m_flags |= M_MCAST;
4263751dddbSGleb Smirnoff 		if_inc_counter(ifp, IFCOUNTER_IMCASTS, 1);
42769462a82SBruce M Simpson 	}
42869462a82SBruce M Simpson 
429533d8562SRobert Watson #ifdef MAC
430533d8562SRobert Watson 	/*
431533d8562SRobert Watson 	 * Tag the mbuf with an appropriate MAC label before any other
432533d8562SRobert Watson 	 * consumers can get to it.
433533d8562SRobert Watson 	 */
43430d239bcSRobert Watson 	mac_ifnet_create_mbuf(ifp, m);
435533d8562SRobert Watson #endif
436533d8562SRobert Watson 
437c1d93b05SSam Leffler 	/*
43869462a82SBruce M Simpson 	 * Give bpf a chance at the packet.
439c1d93b05SSam Leffler 	 */
440d05d4616SChristian S.J. Peron 	ETHER_BPF_MTAP(ifp, m);
4412e2de7f2SArchie Cobbs 
44269462a82SBruce M Simpson 	/*
44369462a82SBruce M Simpson 	 * If the CRC is still on the packet, trim it off. We do this once
44469462a82SBruce M Simpson 	 * and once only in case we are re-entered. Nothing else on the
44569462a82SBruce M Simpson 	 * Ethernet receive path expects to see the FCS.
44669462a82SBruce M Simpson 	 */
447c1d93b05SSam Leffler 	if (m->m_flags & M_HASFCS) {
448c1d93b05SSam Leffler 		m_adj(m, -ETHER_CRC_LEN);
449c1d93b05SSam Leffler 		m->m_flags &= ~M_HASFCS;
450c1d93b05SSam Leffler 	}
451c1d93b05SSam Leffler 
4524cdc1f54SGleb Smirnoff 	if (!(ifp->if_capenable & IFCAP_HWSTATS))
4533751dddbSGleb Smirnoff 		if_inc_counter(ifp, IFCOUNTER_IBYTES, m->m_pkthdr.len);
45405463bb5SDavid Greenman 
45569462a82SBruce M Simpson 	/* Allow monitor mode to claim this frame, after stats are updated. */
456de572b37SChristian S.J. Peron 	if (ifp->if_flags & IFF_MONITOR) {
457de572b37SChristian S.J. Peron 		m_freem(m);
45821ca7b57SMarko Zec 		CURVNET_RESTORE();
459de572b37SChristian S.J. Peron 		return;
460de572b37SChristian S.J. Peron 	}
461de572b37SChristian S.J. Peron 
46218242d3bSAndrew Thompson 	/* Handle input from a lagg(4) port */
463b47888ceSAndrew Thompson 	if (ifp->if_type == IFT_IEEE8023ADLAG) {
46418242d3bSAndrew Thompson 		KASSERT(lagg_input_p != NULL,
46518242d3bSAndrew Thompson 		    ("%s: if_lagg not loaded!", __func__));
46618242d3bSAndrew Thompson 		m = (*lagg_input_p)(ifp, m);
467b47888ceSAndrew Thompson 		if (m != NULL)
468b47888ceSAndrew Thompson 			ifp = m->m_pkthdr.rcvif;
4692db13e75SMarko Zec 		else {
4702db13e75SMarko Zec 			CURVNET_RESTORE();
471b47888ceSAndrew Thompson 			return;
472b47888ceSAndrew Thompson 		}
4732db13e75SMarko Zec 	}
474b47888ceSAndrew Thompson 
47569462a82SBruce M Simpson 	/*
47669462a82SBruce M Simpson 	 * If the hardware did not process an 802.1Q tag, do this now,
47769462a82SBruce M Simpson 	 * to allow 802.1P priority frames to be passed to the main input
47869462a82SBruce M Simpson 	 * path correctly.
47969462a82SBruce M Simpson 	 * TODO: Deal with Q-in-Q frames, but not arbitrary nesting levels.
48069462a82SBruce M Simpson 	 */
48169462a82SBruce M Simpson 	if ((m->m_flags & M_VLANTAG) == 0 && etype == ETHERTYPE_VLAN) {
48269462a82SBruce M Simpson 		struct ether_vlan_header *evl;
48369462a82SBruce M Simpson 
48469462a82SBruce M Simpson 		if (m->m_len < sizeof(*evl) &&
48569462a82SBruce M Simpson 		    (m = m_pullup(m, sizeof(*evl))) == NULL) {
486402d5e27SBruce M Simpson #ifdef DIAGNOSTIC
48769462a82SBruce M Simpson 			if_printf(ifp, "cannot pullup VLAN header\n");
488402d5e27SBruce M Simpson #endif
4893751dddbSGleb Smirnoff 			if_inc_counter(ifp, IFCOUNTER_IERRORS, 1);
49069462a82SBruce M Simpson 			m_freem(m);
4912db13e75SMarko Zec 			CURVNET_RESTORE();
49269462a82SBruce M Simpson 			return;
49369462a82SBruce M Simpson 		}
49469462a82SBruce M Simpson 
49569462a82SBruce M Simpson 		evl = mtod(m, struct ether_vlan_header *);
49669462a82SBruce M Simpson 		m->m_pkthdr.ether_vtag = ntohs(evl->evl_tag);
49769462a82SBruce M Simpson 		m->m_flags |= M_VLANTAG;
49869462a82SBruce M Simpson 
49969462a82SBruce M Simpson 		bcopy((char *)evl, (char *)evl + ETHER_VLAN_ENCAP_LEN,
50069462a82SBruce M Simpson 		    ETHER_HDR_LEN - ETHER_TYPE_LEN);
50169462a82SBruce M Simpson 		m_adj(m, ETHER_VLAN_ENCAP_LEN);
50297cce87fSGleb Smirnoff 		eh = mtod(m, struct ether_header *);
50369462a82SBruce M Simpson 	}
50469462a82SBruce M Simpson 
505a34c6aebSBjoern A. Zeeb 	M_SETFIB(m, ifp->if_fib);
506a34c6aebSBjoern A. Zeeb 
50769462a82SBruce M Simpson 	/* Allow ng_ether(4) to claim this frame. */
508833e8dc5SGleb Smirnoff 	if (ifp->if_l2com != NULL) {
509514bcb89SPoul-Henning Kamp 		KASSERT(ng_ether_input_p != NULL,
51069462a82SBruce M Simpson 		    ("%s: ng_ether_input_p is NULL", __func__));
51169462a82SBruce M Simpson 		m->m_flags &= ~M_PROMISC;
512c1d93b05SSam Leffler 		(*ng_ether_input_p)(ifp, &m);
51321ca7b57SMarko Zec 		if (m == NULL) {
51421ca7b57SMarko Zec 			CURVNET_RESTORE();
515e1e1452dSArchie Cobbs 			return;
516e1e1452dSArchie Cobbs 		}
5175e9a5429SGleb Smirnoff 		eh = mtod(m, struct ether_header *);
51821ca7b57SMarko Zec 	}
519e1e1452dSArchie Cobbs 
5208f867517SAndrew Thompson 	/*
52169462a82SBruce M Simpson 	 * Allow if_bridge(4) to claim this frame.
52269462a82SBruce M Simpson 	 * The BRIDGE_INPUT() macro will update ifp if the bridge changed it
52369462a82SBruce M Simpson 	 * and the frame should be delivered locally.
5248f867517SAndrew Thompson 	 */
52569462a82SBruce M Simpson 	if (ifp->if_bridge != NULL) {
52669462a82SBruce M Simpson 		m->m_flags &= ~M_PROMISC;
527fd6238a6SAndrew Thompson 		BRIDGE_INPUT(ifp, m);
52821ca7b57SMarko Zec 		if (m == NULL) {
52921ca7b57SMarko Zec 			CURVNET_RESTORE();
5308f867517SAndrew Thompson 			return;
5318f867517SAndrew Thompson 		}
5325e9a5429SGleb Smirnoff 		eh = mtod(m, struct ether_header *);
53321ca7b57SMarko Zec 	}
5348f867517SAndrew Thompson 
535259d2d54SBjoern A. Zeeb #if defined(INET) || defined(INET6)
53669462a82SBruce M Simpson 	/*
53769462a82SBruce M Simpson 	 * Clear M_PROMISC on frame so that carp(4) will see it when the
53869462a82SBruce M Simpson 	 * mbuf flows up to Layer 3.
53969462a82SBruce M Simpson 	 * FreeBSD's implementation of carp(4) uses the inprotosw
54069462a82SBruce M Simpson 	 * to dispatch IPPROTO_CARP. carp(4) also allocates its own
54169462a82SBruce M Simpson 	 * Ethernet addresses of the form 00:00:5e:00:01:xx, which
54269462a82SBruce M Simpson 	 * is outside the scope of the M_PROMISC test below.
54369462a82SBruce M Simpson 	 * TODO: Maintain a hash table of ethernet addresses other than
54469462a82SBruce M Simpson 	 * ether_dhost which may be active on this ifp.
54569462a82SBruce M Simpson 	 */
54654bfbd51SWill Andrews 	if (ifp->if_carp && (*carp_forus_p)(ifp, eh->ether_dhost)) {
54769462a82SBruce M Simpson 		m->m_flags &= ~M_PROMISC;
54869462a82SBruce M Simpson 	} else
54969462a82SBruce M Simpson #endif
55069462a82SBruce M Simpson 	{
55169462a82SBruce M Simpson 		/*
552e7f8c833SBruce M Simpson 		 * If the frame received was not for our MAC address, set the
55369462a82SBruce M Simpson 		 * M_PROMISC flag on the mbuf chain. The frame may need to
55469462a82SBruce M Simpson 		 * be seen by the rest of the Ethernet input path in case of
55569462a82SBruce M Simpson 		 * re-entry (e.g. bridge, vlan, netgraph) but should not be
55669462a82SBruce M Simpson 		 * seen by upper protocol layers.
55769462a82SBruce M Simpson 		 */
55869462a82SBruce M Simpson 		if (!ETHER_IS_MULTICAST(eh->ether_dhost) &&
559e7f8c833SBruce M Simpson 		    bcmp(IF_LLADDR(ifp), eh->ether_dhost, ETHER_ADDR_LEN) != 0)
56069462a82SBruce M Simpson 			m->m_flags |= M_PROMISC;
56169462a82SBruce M Simpson 	}
56269462a82SBruce M Simpson 
563dd50b310SAdrian Chadd 	random_harvest(&(m->m_data), 12, 2, RANDOM_NET_ETHER);
56469462a82SBruce M Simpson 
565acf032f5SRobert Watson 	ether_demux(ifp, m);
56621ca7b57SMarko Zec 	CURVNET_RESTORE();
567e1e1452dSArchie Cobbs }
568e1e1452dSArchie Cobbs 
569e1e1452dSArchie Cobbs /*
5706cb52192SRobert Watson  * Ethernet input dispatch; by default, direct dispatch here regardless of
5717527624eSRobert Watson  * global configuration.  However, if RSS is enabled, hook up RSS affinity
5727527624eSRobert Watson  * so that when deferred or hybrid dispatch is enabled, we can redistribute
5737527624eSRobert Watson  * load based on RSS.
5747527624eSRobert Watson  *
5757527624eSRobert Watson  * XXXRW: Would be nice if the ifnet passed up a flag indicating whether or
5767527624eSRobert Watson  * not it had already done work distribution via multi-queue.  Then we could
5777527624eSRobert Watson  * direct dispatch in the event load balancing was already complete and
5787527624eSRobert Watson  * handle the case of interfaces with different capabilities better.
5797527624eSRobert Watson  *
5807527624eSRobert Watson  * XXXRW: Sort of want an M_DISTRIBUTED flag to avoid multiple distributions
5817527624eSRobert Watson  * at multiple layers?
5827527624eSRobert Watson  *
5837527624eSRobert Watson  * XXXRW: For now, enable all this only if RSS is compiled in, although it
5847527624eSRobert Watson  * works fine without RSS.  Need to characterise the performance overhead
5857527624eSRobert Watson  * of the detour through the netisr code in the event the result is always
5867527624eSRobert Watson  * direct dispatch.
5876cb52192SRobert Watson  */
5886cb52192SRobert Watson static void
5896cb52192SRobert Watson ether_nh_input(struct mbuf *m)
5906cb52192SRobert Watson {
5916cb52192SRobert Watson 
5926cb52192SRobert Watson 	ether_input_internal(m->m_pkthdr.rcvif, m);
5936cb52192SRobert Watson }
5946cb52192SRobert Watson 
5956cb52192SRobert Watson static struct netisr_handler	ether_nh = {
5966cb52192SRobert Watson 	.nh_name = "ether",
5976cb52192SRobert Watson 	.nh_handler = ether_nh_input,
5986cb52192SRobert Watson 	.nh_proto = NETISR_ETHER,
5997527624eSRobert Watson #ifdef RSS
6007527624eSRobert Watson 	.nh_policy = NETISR_POLICY_CPU,
6017527624eSRobert Watson 	.nh_dispatch = NETISR_DISPATCH_DIRECT,
6027527624eSRobert Watson 	.nh_m2cpuid = rss_m2cpuid,
6037527624eSRobert Watson #else
6046cb52192SRobert Watson 	.nh_policy = NETISR_POLICY_SOURCE,
6056cb52192SRobert Watson 	.nh_dispatch = NETISR_DISPATCH_DIRECT,
6067527624eSRobert Watson #endif
6076cb52192SRobert Watson };
6086cb52192SRobert Watson 
6096cb52192SRobert Watson static void
6106cb52192SRobert Watson ether_init(__unused void *arg)
6116cb52192SRobert Watson {
6126cb52192SRobert Watson 
6136cb52192SRobert Watson 	netisr_register(&ether_nh);
6146cb52192SRobert Watson }
6156cb52192SRobert Watson SYSINIT(ether, SI_SUB_INIT_IF, SI_ORDER_ANY, ether_init, NULL);
6166cb52192SRobert Watson 
6176cb52192SRobert Watson static void
6187d4317bdSAlexander V. Chernikov vnet_ether_init(__unused void *arg)
6197d4317bdSAlexander V. Chernikov {
6207d4317bdSAlexander V. Chernikov 	int i;
6217d4317bdSAlexander V. Chernikov 
6227d4317bdSAlexander V. Chernikov 	/* Initialize packet filter hooks. */
6237d4317bdSAlexander V. Chernikov 	V_link_pfil_hook.ph_type = PFIL_TYPE_AF;
6247d4317bdSAlexander V. Chernikov 	V_link_pfil_hook.ph_af = AF_LINK;
6257d4317bdSAlexander V. Chernikov 	if ((i = pfil_head_register(&V_link_pfil_hook)) != 0)
6267d4317bdSAlexander V. Chernikov 		printf("%s: WARNING: unable to register pfil link hook, "
6277d4317bdSAlexander V. Chernikov 			"error %d\n", __func__, i);
6287d4317bdSAlexander V. Chernikov }
6297d4317bdSAlexander V. Chernikov VNET_SYSINIT(vnet_ether_init, SI_SUB_PROTO_IF, SI_ORDER_ANY,
6307d4317bdSAlexander V. Chernikov     vnet_ether_init, NULL);
6317d4317bdSAlexander V. Chernikov 
6327d4317bdSAlexander V. Chernikov static void
6337d4317bdSAlexander V. Chernikov vnet_ether_destroy(__unused void *arg)
6347d4317bdSAlexander V. Chernikov {
6357d4317bdSAlexander V. Chernikov 	int i;
6367d4317bdSAlexander V. Chernikov 
6377d4317bdSAlexander V. Chernikov 	if ((i = pfil_head_unregister(&V_link_pfil_hook)) != 0)
6387d4317bdSAlexander V. Chernikov 		printf("%s: WARNING: unable to unregister pfil link hook, "
6397d4317bdSAlexander V. Chernikov 			"error %d\n", __func__, i);
6407d4317bdSAlexander V. Chernikov }
6417d4317bdSAlexander V. Chernikov VNET_SYSUNINIT(vnet_ether_uninit, SI_SUB_PROTO_IF, SI_ORDER_ANY,
6427d4317bdSAlexander V. Chernikov     vnet_ether_destroy, NULL);
6437d4317bdSAlexander V. Chernikov 
6447d4317bdSAlexander V. Chernikov 
6457d4317bdSAlexander V. Chernikov 
6467d4317bdSAlexander V. Chernikov static void
6476cb52192SRobert Watson ether_input(struct ifnet *ifp, struct mbuf *m)
6486cb52192SRobert Watson {
6496cb52192SRobert Watson 
6504857f5fbSGeorge V. Neville-Neil 	struct mbuf *mn;
6514857f5fbSGeorge V. Neville-Neil 
6524857f5fbSGeorge V. Neville-Neil 	/*
6534857f5fbSGeorge V. Neville-Neil 	 * The drivers are allowed to pass in a chain of packets linked with
6544857f5fbSGeorge V. Neville-Neil 	 * m_nextpkt. We split them up into separate packets here and pass
6554857f5fbSGeorge V. Neville-Neil 	 * them up. This allows the drivers to amortize the receive lock.
6564857f5fbSGeorge V. Neville-Neil 	 */
6574857f5fbSGeorge V. Neville-Neil 	while (m) {
6584857f5fbSGeorge V. Neville-Neil 		mn = m->m_nextpkt;
6594857f5fbSGeorge V. Neville-Neil 		m->m_nextpkt = NULL;
6604857f5fbSGeorge V. Neville-Neil 
6616cb52192SRobert Watson 		/*
6626cb52192SRobert Watson 		 * We will rely on rcvif being set properly in the deferred context,
6636cb52192SRobert Watson 		 * so assert it is correct here.
6646cb52192SRobert Watson 		 */
6656cb52192SRobert Watson 		KASSERT(m->m_pkthdr.rcvif == ifp, ("%s: ifnet mismatch", __func__));
6666cb52192SRobert Watson 		netisr_dispatch(NETISR_ETHER, m);
6674857f5fbSGeorge V. Neville-Neil 		m = mn;
6684857f5fbSGeorge V. Neville-Neil 	}
6696cb52192SRobert Watson }
6706cb52192SRobert Watson 
6716cb52192SRobert Watson /*
672e1e1452dSArchie Cobbs  * Upper layer processing for a received Ethernet packet.
673e1e1452dSArchie Cobbs  */
674e1e1452dSArchie Cobbs void
675c1d93b05SSam Leffler ether_demux(struct ifnet *ifp, struct mbuf *m)
676e1e1452dSArchie Cobbs {
677c1d93b05SSam Leffler 	struct ether_header *eh;
6787d4317bdSAlexander V. Chernikov 	int i, isr;
679e1e1452dSArchie Cobbs 	u_short ether_type;
68069462a82SBruce M Simpson 
68169462a82SBruce M Simpson 	KASSERT(ifp != NULL, ("%s: NULL interface pointer", __func__));
68269462a82SBruce M Simpson 
6837d4317bdSAlexander V. Chernikov 	/* Do not grab PROMISC frames in case we are re-entered. */
6847d4317bdSAlexander V. Chernikov 	if (PFIL_HOOKED(&V_link_pfil_hook) && !(m->m_flags & M_PROMISC)) {
6857d4317bdSAlexander V. Chernikov 		i = pfil_run_hooks(&V_link_pfil_hook, &m, ifp, PFIL_IN, NULL);
6867d4317bdSAlexander V. Chernikov 
6877d4317bdSAlexander V. Chernikov 		if (i != 0 || m == NULL)
6887d4317bdSAlexander V. Chernikov 			return;
68969462a82SBruce M Simpson 	}
6907d4317bdSAlexander V. Chernikov 
691c1d93b05SSam Leffler 	eh = mtod(m, struct ether_header *);
692cd0cd014SJoerg Wunsch 	ether_type = ntohs(eh->ether_type);
693c1d93b05SSam Leffler 
694a9771948SGleb Smirnoff 	/*
69569462a82SBruce M Simpson 	 * If this frame has a VLAN tag other than 0, call vlan_input()
69669462a82SBruce M Simpson 	 * if its module is loaded. Otherwise, drop.
697a9771948SGleb Smirnoff 	 */
69869462a82SBruce M Simpson 	if ((m->m_flags & M_VLANTAG) &&
69969462a82SBruce M Simpson 	    EVL_VLANOFTAG(m->m_pkthdr.ether_vtag) != 0) {
70075ee267cSGleb Smirnoff 		if (ifp->if_vlantrunk == NULL) {
7013751dddbSGleb Smirnoff 			if_inc_counter(ifp, IFCOUNTER_NOPROTO, 1);
7026c23e6ccSRuslan Ermilov 			m_freem(m);
7036c23e6ccSRuslan Ermilov 			return;
7046c23e6ccSRuslan Ermilov 		}
70569462a82SBruce M Simpson 		KASSERT(vlan_input_p != NULL,("%s: VLAN not loaded!",
70669462a82SBruce M Simpson 		    __func__));
70769462a82SBruce M Simpson 		/* Clear before possibly re-entering ether_input(). */
70869462a82SBruce M Simpson 		m->m_flags &= ~M_PROMISC;
709c1d93b05SSam Leffler 		(*vlan_input_p)(ifp, m);
710c1d93b05SSam Leffler 		return;
711c1d93b05SSam Leffler 	}
712c1d93b05SSam Leffler 
713c1d93b05SSam Leffler 	/*
71469462a82SBruce M Simpson 	 * Pass promiscuously received frames to the upper layer if the user
71569462a82SBruce M Simpson 	 * requested this by setting IFF_PPROMISC. Otherwise, drop them.
716c1d93b05SSam Leffler 	 */
71769462a82SBruce M Simpson 	if ((ifp->if_flags & IFF_PPROMISC) == 0 && (m->m_flags & M_PROMISC)) {
718c1d93b05SSam Leffler 		m_freem(m);
719c1d93b05SSam Leffler 		return;
720c1d93b05SSam Leffler 	}
721c1d93b05SSam Leffler 
72269462a82SBruce M Simpson 	/*
72369462a82SBruce M Simpson 	 * Reset layer specific mbuf flags to avoid confusing upper layers.
72469462a82SBruce M Simpson 	 * Strip off Ethernet header.
72569462a82SBruce M Simpson 	 */
72669462a82SBruce M Simpson 	m->m_flags &= ~M_VLANTAG;
72786bd0491SAndre Oppermann 	m_clrprotoflags(m);
728797f247bSMatthew N. Dodd 	m_adj(m, ETHER_HDR_LEN);
729c1d93b05SSam Leffler 
73069462a82SBruce M Simpson 	/*
73169462a82SBruce M Simpson 	 * Dispatch frame to upper layer.
73269462a82SBruce M Simpson 	 */
733307d80beSDavid Greenman 	switch (ether_type) {
734df8bae1dSRodney W. Grimes #ifdef INET
735df8bae1dSRodney W. Grimes 	case ETHERTYPE_IP:
7365d691e6dSAndre Oppermann 		if ((m = ip_fastforward(m)) == NULL)
7371f91d8c5SDavid Greenman 			return;
7381cafed39SJonathan Lemon 		isr = NETISR_IP;
739df8bae1dSRodney W. Grimes 		break;
740df8bae1dSRodney W. Grimes 
741df8bae1dSRodney W. Grimes 	case ETHERTYPE_ARP:
74208aadfbbSJonathan Lemon 		if (ifp->if_flags & IFF_NOARP) {
74308aadfbbSJonathan Lemon 			/* Discard packet if ARP is disabled on interface */
74408aadfbbSJonathan Lemon 			m_freem(m);
74508aadfbbSJonathan Lemon 			return;
74608aadfbbSJonathan Lemon 		}
7471cafed39SJonathan Lemon 		isr = NETISR_ARP;
748df8bae1dSRodney W. Grimes 		break;
749df8bae1dSRodney W. Grimes #endif
75082cd038dSYoshinobu Inoue #ifdef INET6
75182cd038dSYoshinobu Inoue 	case ETHERTYPE_IPV6:
7521cafed39SJonathan Lemon 		isr = NETISR_IPV6;
75382cd038dSYoshinobu Inoue 		break;
75482cd038dSYoshinobu Inoue #endif
755df8bae1dSRodney W. Grimes 	default:
7561cafed39SJonathan Lemon 		goto discard;
757df8bae1dSRodney W. Grimes 	}
7581cafed39SJonathan Lemon 	netisr_dispatch(isr, m);
759c1d93b05SSam Leffler 	return;
7601cafed39SJonathan Lemon 
761c1d93b05SSam Leffler discard:
762c1d93b05SSam Leffler 	/*
763c1d93b05SSam Leffler 	 * Packet is to be discarded.  If netgraph is present,
764c1d93b05SSam Leffler 	 * hand the packet to it for last chance processing;
765c1d93b05SSam Leffler 	 * otherwise dispose of it.
766c1d93b05SSam Leffler 	 */
767833e8dc5SGleb Smirnoff 	if (ifp->if_l2com != NULL) {
768514bcb89SPoul-Henning Kamp 		KASSERT(ng_ether_input_orphan_p != NULL,
769514bcb89SPoul-Henning Kamp 		    ("ng_ether_input_orphan_p is NULL"));
770c1d93b05SSam Leffler 		/*
771c1d93b05SSam Leffler 		 * Put back the ethernet header so netgraph has a
772c1d93b05SSam Leffler 		 * consistent view of inbound packets.
773c1d93b05SSam Leffler 		 */
774eb1b1807SGleb Smirnoff 		M_PREPEND(m, ETHER_HDR_LEN, M_NOWAIT);
775c1d93b05SSam Leffler 		(*ng_ether_input_orphan_p)(ifp, m);
776c1d93b05SSam Leffler 		return;
777c1d93b05SSam Leffler 	}
778c1d93b05SSam Leffler 	m_freem(m);
779c1d93b05SSam Leffler }
780c1d93b05SSam Leffler 
781c1d93b05SSam Leffler /*
782c1d93b05SSam Leffler  * Convert Ethernet address to printable (loggable) representation.
783c1d93b05SSam Leffler  * This routine is for compatibility; it's better to just use
784c1d93b05SSam Leffler  *
785c1d93b05SSam Leffler  *	printf("%6D", <pointer to address>, ":");
786c1d93b05SSam Leffler  *
787c1d93b05SSam Leffler  * since there's no static buffer involved.
788c1d93b05SSam Leffler  */
789c1d93b05SSam Leffler char *
790c1d93b05SSam Leffler ether_sprintf(const u_char *ap)
791c1d93b05SSam Leffler {
792c1d93b05SSam Leffler 	static char etherbuf[18];
793c1d93b05SSam Leffler 	snprintf(etherbuf, sizeof (etherbuf), "%6D", ap, ":");
794c1d93b05SSam Leffler 	return (etherbuf);
795df8bae1dSRodney W. Grimes }
796df8bae1dSRodney W. Grimes 
797df8bae1dSRodney W. Grimes /*
798df8bae1dSRodney W. Grimes  * Perform common duties while attaching to interface list
799df8bae1dSRodney W. Grimes  */
800df8bae1dSRodney W. Grimes void
801d09ed26fSRuslan Ermilov ether_ifattach(struct ifnet *ifp, const u_int8_t *lla)
802df8bae1dSRodney W. Grimes {
803f93dfa28SBrooks Davis 	int i;
804098a8c3bSMatthew N. Dodd 	struct ifaddr *ifa;
805098a8c3bSMatthew N. Dodd 	struct sockaddr_dl *sdl;
806df8bae1dSRodney W. Grimes 
807c1d93b05SSam Leffler 	ifp->if_addrlen = ETHER_ADDR_LEN;
808c1d93b05SSam Leffler 	ifp->if_hdrlen = ETHER_HDR_LEN;
809cfeff1b6SJonathan Lemon 	if_attach(ifp);
810df8bae1dSRodney W. Grimes 	ifp->if_mtu = ETHERMTU;
811c1d93b05SSam Leffler 	ifp->if_output = ether_output;
812c1d93b05SSam Leffler 	ifp->if_input = ether_input;
8131158dfb7SGarrett Wollman 	ifp->if_resolvemulti = ether_resolvemulti;
814d3c351c5SMarko Zec #ifdef VIMAGE
815d3c351c5SMarko Zec 	ifp->if_reassign = ether_reassign;
816d3c351c5SMarko Zec #endif
817a330e1f1SGary Palmer 	if (ifp->if_baudrate == 0)
818c1d93b05SSam Leffler 		ifp->if_baudrate = IF_Mbps(10);		/* just a default */
819322dcb8dSMax Khon 	ifp->if_broadcastaddr = etherbroadcastaddr;
820c1d93b05SSam Leffler 
8214a0d6638SRuslan Ermilov 	ifa = ifp->if_addr;
8226e551fb6SDavid E. O'Brien 	KASSERT(ifa != NULL, ("%s: no lladdr!\n", __func__));
82359562606SGarrett Wollman 	sdl = (struct sockaddr_dl *)ifa->ifa_addr;
824df8bae1dSRodney W. Grimes 	sdl->sdl_type = IFT_ETHER;
825df8bae1dSRodney W. Grimes 	sdl->sdl_alen = ifp->if_addrlen;
826d09ed26fSRuslan Ermilov 	bcopy(lla, LLADDR(sdl), ifp->if_addrlen);
827c1d93b05SSam Leffler 
828797f247bSMatthew N. Dodd 	bpfattach(ifp, DLT_EN10MB, ETHER_HDR_LEN);
829e1e1452dSArchie Cobbs 	if (ng_ether_attach_p != NULL)
830e1e1452dSArchie Cobbs 		(*ng_ether_attach_p)(ifp);
831e3bbbec2SMatthew N. Dodd 
832f93dfa28SBrooks Davis 	/* Announce Ethernet MAC address if non-zero. */
833f93dfa28SBrooks Davis 	for (i = 0; i < ifp->if_addrlen; i++)
834d09ed26fSRuslan Ermilov 		if (lla[i] != 0)
835f93dfa28SBrooks Davis 			break;
836f93dfa28SBrooks Davis 	if (i != ifp->if_addrlen)
837d09ed26fSRuslan Ermilov 		if_printf(ifp, "Ethernet address: %6D\n", lla, ":");
838ef1f9169SMarcel Moolenaar 
839ef1f9169SMarcel Moolenaar 	uuid_ether_add(LLADDR(sdl));
840e1e1452dSArchie Cobbs }
841e1e1452dSArchie Cobbs 
84221b8ebd9SArchie Cobbs /*
84321b8ebd9SArchie Cobbs  * Perform common duties while detaching an Ethernet interface
84421b8ebd9SArchie Cobbs  */
84521b8ebd9SArchie Cobbs void
846c1d93b05SSam Leffler ether_ifdetach(struct ifnet *ifp)
84721b8ebd9SArchie Cobbs {
848ef1f9169SMarcel Moolenaar 	struct sockaddr_dl *sdl;
849ef1f9169SMarcel Moolenaar 
850ef1f9169SMarcel Moolenaar 	sdl = (struct sockaddr_dl *)(ifp->if_addr->ifa_addr);
851ef1f9169SMarcel Moolenaar 	uuid_ether_del(LLADDR(sdl));
852ef1f9169SMarcel Moolenaar 
853833e8dc5SGleb Smirnoff 	if (ifp->if_l2com != NULL) {
854514bcb89SPoul-Henning Kamp 		KASSERT(ng_ether_detach_p != NULL,
855514bcb89SPoul-Henning Kamp 		    ("ng_ether_detach_p is NULL"));
85621b8ebd9SArchie Cobbs 		(*ng_ether_detach_p)(ifp);
857514bcb89SPoul-Henning Kamp 	}
85820a65f37SAndrew Thompson 
85921b8ebd9SArchie Cobbs 	bpfdetach(ifp);
86021b8ebd9SArchie Cobbs 	if_detach(ifp);
86121b8ebd9SArchie Cobbs }
86221b8ebd9SArchie Cobbs 
#ifdef VIMAGE
/*
 * if_reassign method: move the interface's netgraph attachment along when
 * the interface changes vnet.  Netgraph is detached in the current context
 * and, if the netgraph attach hook is present, re-attached with `new_vnet'
 * as the current vnet.
 */
void
ether_reassign(struct ifnet *ifp, struct vnet *new_vnet, char *unused __unused)
{

	if (ifp->if_l2com != NULL) {
		KASSERT(ng_ether_detach_p != NULL,
		    ("ng_ether_detach_p is NULL"));
		(*ng_ether_detach_p)(ifp);
	}

	if (ng_ether_attach_p == NULL)
		return;

	CURVNET_SET_QUIET(new_vnet);
	(*ng_ether_attach_p)(ifp);
	CURVNET_RESTORE();
}
#endif
881d3c351c5SMarko Zec 
882ce02431fSDoug Rabson SYSCTL_DECL(_net_link);
883602d513cSGarrett Wollman SYSCTL_NODE(_net_link, IFT_ETHER, ether, CTLFLAG_RW, 0, "Ethernet");
88430106f6aSPoul-Henning Kamp 
#if 0
/*
 * This is for reference.  We have a table-driven version
 * of the little-endian crc32 generator, which is faster
 * than the double-loop.
 */
uint32_t
ether_crc32_le(const uint8_t *buf, size_t len)
{
	size_t i;
	uint32_t crc, carry;
	int bit;
	uint8_t data;

	crc = 0xffffffff;	/* initial value */

	for (i = 0; i < len; i++) {
		for (data = *buf++, bit = 0; bit < 8; bit++, data >>= 1) {
			carry = (crc ^ data) & 1;
			crc >>= 1;
			if (carry)
				crc = (crc ^ ETHER_CRC_POLY_LE);
		}
	}

	return (crc);
}
#else
/*
 * Little-endian (reflected) CRC-32 over `len' bytes at `buf', computed
 * four bits at a time from a 16-entry table.
 *
 * The register starts at 0xffffffff and is returned as-is: no final
 * inversion is applied.  An empty buffer therefore yields 0xffffffff.
 */
uint32_t
ether_crc32_le(const uint8_t *buf, size_t len)
{
	static const uint32_t crctab[] = {
		0x00000000, 0x1db71064, 0x3b6e20c8, 0x26d930ac,
		0x76dc4190, 0x6b6b51f4, 0x4db26158, 0x5005713c,
		0xedb88320, 0xf00f9344, 0xd6d6a3e8, 0xcb61b38c,
		0x9b64c2b0, 0x86d3d2d4, 0xa00ae278, 0xbdbdf21c
	};
	size_t i;
	uint32_t crc;

	crc = 0xffffffff;	/* initial value */

	for (i = 0; i < len; i++) {
		crc ^= buf[i];
		/* Consume the byte as two nibbles, low nibble first. */
		crc = (crc >> 4) ^ crctab[crc & 0xf];
		crc = (crc >> 4) ^ crctab[crc & 0xf];
	}

	return (crc);
}
#endif
93616b4a343SChristian Weisgerber 
93716b4a343SChristian Weisgerber uint32_t
93816b4a343SChristian Weisgerber ether_crc32_be(const uint8_t *buf, size_t len)
93916b4a343SChristian Weisgerber {
94016b4a343SChristian Weisgerber 	size_t i;
94116b4a343SChristian Weisgerber 	uint32_t crc, carry;
94216b4a343SChristian Weisgerber 	int bit;
94316b4a343SChristian Weisgerber 	uint8_t data;
94416b4a343SChristian Weisgerber 
94516b4a343SChristian Weisgerber 	crc = 0xffffffff;	/* initial value */
94616b4a343SChristian Weisgerber 
94716b4a343SChristian Weisgerber 	for (i = 0; i < len; i++) {
94816b4a343SChristian Weisgerber 		for (data = *buf++, bit = 0; bit < 8; bit++, data >>= 1) {
94916b4a343SChristian Weisgerber 			carry = ((crc & 0x80000000) ? 1 : 0) ^ (data & 0x01);
95016b4a343SChristian Weisgerber 			crc <<= 1;
95116b4a343SChristian Weisgerber 			if (carry)
95216b4a343SChristian Weisgerber 				crc = (crc ^ ETHER_CRC_POLY_BE) | carry;
95316b4a343SChristian Weisgerber 		}
95416b4a343SChristian Weisgerber 	}
95516b4a343SChristian Weisgerber 
95616b4a343SChristian Weisgerber 	return (crc);
95716b4a343SChristian Weisgerber }
95816b4a343SChristian Weisgerber 
959fb583156SDavid Greenman int
960995c7fd1SYaroslav Tykhiy ether_ioctl(struct ifnet *ifp, u_long command, caddr_t data)
96130106f6aSPoul-Henning Kamp {
96230106f6aSPoul-Henning Kamp 	struct ifaddr *ifa = (struct ifaddr *) data;
96330106f6aSPoul-Henning Kamp 	struct ifreq *ifr = (struct ifreq *) data;
964fb583156SDavid Greenman 	int error = 0;
96530106f6aSPoul-Henning Kamp 
96630106f6aSPoul-Henning Kamp 	switch (command) {
96730106f6aSPoul-Henning Kamp 	case SIOCSIFADDR:
96830106f6aSPoul-Henning Kamp 		ifp->if_flags |= IFF_UP;
96930106f6aSPoul-Henning Kamp 
97030106f6aSPoul-Henning Kamp 		switch (ifa->ifa_addr->sa_family) {
97130106f6aSPoul-Henning Kamp #ifdef INET
97230106f6aSPoul-Henning Kamp 		case AF_INET:
97330106f6aSPoul-Henning Kamp 			ifp->if_init(ifp->if_softc);	/* before arpwhohas */
974322dcb8dSMax Khon 			arp_ifinit(ifp, ifa);
97530106f6aSPoul-Henning Kamp 			break;
97630106f6aSPoul-Henning Kamp #endif
97730106f6aSPoul-Henning Kamp 		default:
97830106f6aSPoul-Henning Kamp 			ifp->if_init(ifp->if_softc);
97930106f6aSPoul-Henning Kamp 			break;
98030106f6aSPoul-Henning Kamp 		}
98130106f6aSPoul-Henning Kamp 		break;
98230106f6aSPoul-Henning Kamp 
98330106f6aSPoul-Henning Kamp 	case SIOCGIFADDR:
98430106f6aSPoul-Henning Kamp 		{
98530106f6aSPoul-Henning Kamp 			struct sockaddr *sa;
98630106f6aSPoul-Henning Kamp 
98730106f6aSPoul-Henning Kamp 			sa = (struct sockaddr *) & ifr->ifr_data;
9884a0d6638SRuslan Ermilov 			bcopy(IF_LLADDR(ifp),
98930106f6aSPoul-Henning Kamp 			      (caddr_t) sa->sa_data, ETHER_ADDR_LEN);
99030106f6aSPoul-Henning Kamp 		}
99130106f6aSPoul-Henning Kamp 		break;
992fb583156SDavid Greenman 
993fb583156SDavid Greenman 	case SIOCSIFMTU:
994fb583156SDavid Greenman 		/*
995fb583156SDavid Greenman 		 * Set the interface MTU.
996fb583156SDavid Greenman 		 */
997fb583156SDavid Greenman 		if (ifr->ifr_mtu > ETHERMTU) {
998fb583156SDavid Greenman 			error = EINVAL;
999fb583156SDavid Greenman 		} else {
1000fb583156SDavid Greenman 			ifp->if_mtu = ifr->ifr_mtu;
100130106f6aSPoul-Henning Kamp 		}
1002fb583156SDavid Greenman 		break;
1003c1d93b05SSam Leffler 	default:
1004c1d93b05SSam Leffler 		error = EINVAL;			/* XXX netbsd has ENOTTY??? */
1005c1d93b05SSam Leffler 		break;
1006fb583156SDavid Greenman 	}
1007fb583156SDavid Greenman 	return (error);
100830106f6aSPoul-Henning Kamp }
10091158dfb7SGarrett Wollman 
101037c84183SPoul-Henning Kamp static int
101172fd1b6aSDag-Erling Smørgrav ether_resolvemulti(struct ifnet *ifp, struct sockaddr **llsa,
101272fd1b6aSDag-Erling Smørgrav 	struct sockaddr *sa)
10131158dfb7SGarrett Wollman {
10141158dfb7SGarrett Wollman 	struct sockaddr_dl *sdl;
1015d7647d96SDag-Erling Smørgrav #ifdef INET
10161158dfb7SGarrett Wollman 	struct sockaddr_in *sin;
1017d7647d96SDag-Erling Smørgrav #endif
101882cd038dSYoshinobu Inoue #ifdef INET6
101982cd038dSYoshinobu Inoue 	struct sockaddr_in6 *sin6;
102082cd038dSYoshinobu Inoue #endif
10211158dfb7SGarrett Wollman 	u_char *e_addr;
10221158dfb7SGarrett Wollman 
10231158dfb7SGarrett Wollman 	switch(sa->sa_family) {
10241158dfb7SGarrett Wollman 	case AF_LINK:
10257f33a738SJulian Elischer 		/*
10267f33a738SJulian Elischer 		 * No mapping needed. Just check that it's a valid MC address.
10277f33a738SJulian Elischer 		 */
10281158dfb7SGarrett Wollman 		sdl = (struct sockaddr_dl *)sa;
10291158dfb7SGarrett Wollman 		e_addr = LLADDR(sdl);
1030086e98c4SBruce M Simpson 		if (!ETHER_IS_MULTICAST(e_addr))
10311158dfb7SGarrett Wollman 			return EADDRNOTAVAIL;
10321158dfb7SGarrett Wollman 		*llsa = 0;
10331158dfb7SGarrett Wollman 		return 0;
10341158dfb7SGarrett Wollman 
10351158dfb7SGarrett Wollman #ifdef INET
10361158dfb7SGarrett Wollman 	case AF_INET:
10371158dfb7SGarrett Wollman 		sin = (struct sockaddr_in *)sa;
10381158dfb7SGarrett Wollman 		if (!IN_MULTICAST(ntohl(sin->sin_addr.s_addr)))
10391158dfb7SGarrett Wollman 			return EADDRNOTAVAIL;
104095fbe4d0SAlexander V. Chernikov 		sdl = link_init_sdl(ifp, *llsa, IFT_ETHER);
10411158dfb7SGarrett Wollman 		sdl->sdl_alen = ETHER_ADDR_LEN;
10421158dfb7SGarrett Wollman 		e_addr = LLADDR(sdl);
10431158dfb7SGarrett Wollman 		ETHER_MAP_IP_MULTICAST(&sin->sin_addr, e_addr);
10441158dfb7SGarrett Wollman 		*llsa = (struct sockaddr *)sdl;
10451158dfb7SGarrett Wollman 		return 0;
10461158dfb7SGarrett Wollman #endif
104782cd038dSYoshinobu Inoue #ifdef INET6
104882cd038dSYoshinobu Inoue 	case AF_INET6:
104982cd038dSYoshinobu Inoue 		sin6 = (struct sockaddr_in6 *)sa;
1050595b8a1cSJun-ichiro itojun Hagino 		if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) {
1051595b8a1cSJun-ichiro itojun Hagino 			/*
1052595b8a1cSJun-ichiro itojun Hagino 			 * An IP6 address of 0 means listen to all
1053595b8a1cSJun-ichiro itojun Hagino 			 * of the Ethernet multicast address used for IP6.
1054595b8a1cSJun-ichiro itojun Hagino 			 * (This is used for multicast routers.)
1055595b8a1cSJun-ichiro itojun Hagino 			 */
1056595b8a1cSJun-ichiro itojun Hagino 			ifp->if_flags |= IFF_ALLMULTI;
1057595b8a1cSJun-ichiro itojun Hagino 			*llsa = 0;
1058595b8a1cSJun-ichiro itojun Hagino 			return 0;
1059595b8a1cSJun-ichiro itojun Hagino 		}
106082cd038dSYoshinobu Inoue 		if (!IN6_IS_ADDR_MULTICAST(&sin6->sin6_addr))
106182cd038dSYoshinobu Inoue 			return EADDRNOTAVAIL;
106295fbe4d0SAlexander V. Chernikov 		sdl = link_init_sdl(ifp, *llsa, IFT_ETHER);
106382cd038dSYoshinobu Inoue 		sdl->sdl_alen = ETHER_ADDR_LEN;
106482cd038dSYoshinobu Inoue 		e_addr = LLADDR(sdl);
106582cd038dSYoshinobu Inoue 		ETHER_MAP_IPV6_MULTICAST(&sin6->sin6_addr, e_addr);
106682cd038dSYoshinobu Inoue 		*llsa = (struct sockaddr *)sdl;
106782cd038dSYoshinobu Inoue 		return 0;
106882cd038dSYoshinobu Inoue #endif
10691158dfb7SGarrett Wollman 
10701158dfb7SGarrett Wollman 	default:
10711158dfb7SGarrett Wollman 		/*
10721158dfb7SGarrett Wollman 		 * Well, the text isn't quite right, but it's the name
10731158dfb7SGarrett Wollman 		 * that counts...
10741158dfb7SGarrett Wollman 		 */
10751158dfb7SGarrett Wollman 		return EAFNOSUPPORT;
10761158dfb7SGarrett Wollman 	}
10771158dfb7SGarrett Wollman }
107840811c14SMatthew N. Dodd 
107940811c14SMatthew N. Dodd static moduledata_t ether_mod = {
1080833e8dc5SGleb Smirnoff 	.name = "ether",
108140811c14SMatthew N. Dodd };
108240811c14SMatthew N. Dodd 
108352f1277eSChristian S.J. Peron void
108452f1277eSChristian S.J. Peron ether_vlan_mtap(struct bpf_if *bp, struct mbuf *m, void *data, u_int dlen)
108552f1277eSChristian S.J. Peron {
108652f1277eSChristian S.J. Peron 	struct ether_vlan_header vlan;
108752f1277eSChristian S.J. Peron 	struct mbuf mv, mb;
108852f1277eSChristian S.J. Peron 
108952f1277eSChristian S.J. Peron 	KASSERT((m->m_flags & M_VLANTAG) != 0,
109052f1277eSChristian S.J. Peron 	    ("%s: vlan information not present", __func__));
109152f1277eSChristian S.J. Peron 	KASSERT(m->m_len >= sizeof(struct ether_header),
109252f1277eSChristian S.J. Peron 	    ("%s: mbuf not large enough for header", __func__));
109352f1277eSChristian S.J. Peron 	bcopy(mtod(m, char *), &vlan, sizeof(struct ether_header));
109452f1277eSChristian S.J. Peron 	vlan.evl_proto = vlan.evl_encap_proto;
109552f1277eSChristian S.J. Peron 	vlan.evl_encap_proto = htons(ETHERTYPE_VLAN);
109652f1277eSChristian S.J. Peron 	vlan.evl_tag = htons(m->m_pkthdr.ether_vtag);
109752f1277eSChristian S.J. Peron 	m->m_len -= sizeof(struct ether_header);
109852f1277eSChristian S.J. Peron 	m->m_data += sizeof(struct ether_header);
109952f1277eSChristian S.J. Peron 	/*
110052f1277eSChristian S.J. Peron 	 * If a data link has been supplied by the caller, then we will need to
110152f1277eSChristian S.J. Peron 	 * re-create a stack allocated mbuf chain with the following structure:
110252f1277eSChristian S.J. Peron 	 *
110352f1277eSChristian S.J. Peron 	 * (1) mbuf #1 will contain the supplied data link
110452f1277eSChristian S.J. Peron 	 * (2) mbuf #2 will contain the vlan header
110552f1277eSChristian S.J. Peron 	 * (3) mbuf #3 will contain the original mbuf's packet data
110652f1277eSChristian S.J. Peron 	 *
110752f1277eSChristian S.J. Peron 	 * Otherwise, submit the packet and vlan header via bpf_mtap2().
110852f1277eSChristian S.J. Peron 	 */
110952f1277eSChristian S.J. Peron 	if (data != NULL) {
111052f1277eSChristian S.J. Peron 		mv.m_next = m;
111152f1277eSChristian S.J. Peron 		mv.m_data = (caddr_t)&vlan;
111252f1277eSChristian S.J. Peron 		mv.m_len = sizeof(vlan);
111352f1277eSChristian S.J. Peron 		mb.m_next = &mv;
111452f1277eSChristian S.J. Peron 		mb.m_data = data;
111552f1277eSChristian S.J. Peron 		mb.m_len = dlen;
111652f1277eSChristian S.J. Peron 		bpf_mtap(bp, &mb);
111752f1277eSChristian S.J. Peron 	} else
111852f1277eSChristian S.J. Peron 		bpf_mtap2(bp, &vlan, sizeof(vlan), m);
111952f1277eSChristian S.J. Peron 	m->m_len += sizeof(struct ether_header);
112052f1277eSChristian S.J. Peron 	m->m_data -= sizeof(struct ether_header);
112152f1277eSChristian S.J. Peron }
112252f1277eSChristian S.J. Peron 
112360e87ca8SAndrew Thompson struct mbuf *
1124a0cf8186SAndrew Thompson ether_vlanencap(struct mbuf *m, uint16_t tag)
112560e87ca8SAndrew Thompson {
112660e87ca8SAndrew Thompson 	struct ether_vlan_header *evl;
112760e87ca8SAndrew Thompson 
1128eb1b1807SGleb Smirnoff 	M_PREPEND(m, ETHER_VLAN_ENCAP_LEN, M_NOWAIT);
112960e87ca8SAndrew Thompson 	if (m == NULL)
113060e87ca8SAndrew Thompson 		return (NULL);
113160e87ca8SAndrew Thompson 	/* M_PREPEND takes care of m_len, m_pkthdr.len for us */
113260e87ca8SAndrew Thompson 
113360e87ca8SAndrew Thompson 	if (m->m_len < sizeof(*evl)) {
113460e87ca8SAndrew Thompson 		m = m_pullup(m, sizeof(*evl));
113560e87ca8SAndrew Thompson 		if (m == NULL)
113660e87ca8SAndrew Thompson 			return (NULL);
113760e87ca8SAndrew Thompson 	}
113860e87ca8SAndrew Thompson 
113960e87ca8SAndrew Thompson 	/*
114060e87ca8SAndrew Thompson 	 * Transform the Ethernet header into an Ethernet header
114160e87ca8SAndrew Thompson 	 * with 802.1Q encapsulation.
114260e87ca8SAndrew Thompson 	 */
114360e87ca8SAndrew Thompson 	evl = mtod(m, struct ether_vlan_header *);
114460e87ca8SAndrew Thompson 	bcopy((char *)evl + ETHER_VLAN_ENCAP_LEN,
114560e87ca8SAndrew Thompson 	    (char *)evl, ETHER_HDR_LEN - ETHER_TYPE_LEN);
114660e87ca8SAndrew Thompson 	evl->evl_encap_proto = htons(ETHERTYPE_VLAN);
114760e87ca8SAndrew Thompson 	evl->evl_tag = htons(tag);
114860e87ca8SAndrew Thompson 	return (m);
114960e87ca8SAndrew Thompson }
115060e87ca8SAndrew Thompson 
1151fc74a9f9SBrooks Davis DECLARE_MODULE(ether, ether_mod, SI_SUB_INIT_IF, SI_ORDER_ANY);
115240811c14SMatthew N. Dodd MODULE_VERSION(ether, 1);
1153