xref: /dragonfly/sys/net/bridge/if_bridge.c (revision 49781055)
1 /*
2  * Copyright 2001 Wasabi Systems, Inc.
3  * All rights reserved.
4  *
5  * Written by Jason R. Thorpe for Wasabi Systems, Inc.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice, this list of conditions and the following disclaimer.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  * 3. All advertising materials mentioning features or use of this software
16  *    must display the following acknowledgement:
17  *	This product includes software developed for the NetBSD Project by
18  *	Wasabi Systems, Inc.
19  * 4. The name of Wasabi Systems, Inc. may not be used to endorse
20  *    or promote products derived from this software without specific prior
21  *    written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
24  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
25  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
26  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL WASABI SYSTEMS, INC
27  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
28  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
29  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
30  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
31  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
32  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
33  * POSSIBILITY OF SUCH DAMAGE.
34  */
35 
36 /*
37  * Copyright (c) 1999, 2000 Jason L. Wright (jason@thought.net)
38  * All rights reserved.
39  *
40  * Redistribution and use in source and binary forms, with or without
41  * modification, are permitted provided that the following conditions
42  * are met:
43  * 1. Redistributions of source code must retain the above copyright
44  *    notice, this list of conditions and the following disclaimer.
45  * 2. Redistributions in binary form must reproduce the above copyright
46  *    notice, this list of conditions and the following disclaimer in the
47  *    documentation and/or other materials provided with the distribution.
48  * 3. All advertising materials mentioning features or use of this software
49  *    must display the following acknowledgement:
50  *	This product includes software developed by Jason L. Wright
51  * 4. The name of the author may not be used to endorse or promote products
52  *    derived from this software without specific prior written permission.
53  *
54  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
55  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
56  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
57  * DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
58  * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
59  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
60  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
61  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
62  * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
63  * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
64  * POSSIBILITY OF SUCH DAMAGE.
65  *
66  * $OpenBSD: if_bridge.c,v 1.60 2001/06/15 03:38:33 itojun Exp $
67  * $NetBSD: if_bridge.c,v 1.31 2005/06/01 19:45:34 jdc Exp $
68  * $FreeBSD: src/sys/net/if_bridge.c,v 1.26 2005/10/13 23:05:55 thompsa Exp $
69  * $DragonFly: src/sys/net/bridge/if_bridge.c,v 1.5 2006/01/31 19:05:37 dillon Exp $
70  */
71 
72 /*
73  * Network interface bridge support.
74  *
75  * TODO:
76  *
77  *	- Currently only supports Ethernet-like interfaces (Ethernet,
78  *	  802.11, VLANs on Ethernet, etc.)  Figure out a nice way
79  *	  to bridge other types of interfaces (FDDI-FDDI, and maybe
80  *	  consider heterogeneous bridges).
81  */
82 
83 #include <sys/cdefs.h>
84 
85 #include "opt_inet.h"
86 #include "opt_inet6.h"
87 
88 #include <sys/param.h>
89 #include <sys/mbuf.h>
90 #include <sys/malloc.h>
91 #include <sys/protosw.h>
92 #include <sys/systm.h>
93 #include <sys/time.h>
94 #include <sys/socket.h> /* for net/if.h */
95 #include <sys/sockio.h>
96 #include <sys/ctype.h>  /* string functions */
97 #include <sys/kernel.h>
98 #include <sys/random.h>
99 #include <sys/sysctl.h>
100 #include <sys/module.h>
101 #include <sys/proc.h>
102 #include <sys/lock.h>
103 #include <sys/thread.h>
104 #include <sys/thread2.h>
105 #include <sys/mpipe.h>
106 
107 #include <net/bpf.h>
108 #include <net/if.h>
109 #include <net/if_dl.h>
110 #include <net/if_types.h>
111 #include <net/if_var.h>
112 #include <net/pfil.h>
113 #include <net/ifq_var.h>
114 
115 #include <netinet/in.h> /* for struct arpcom */
116 #include <netinet/in_systm.h>
117 #include <netinet/in_var.h>
118 #include <netinet/ip.h>
119 #include <netinet/ip_var.h>
120 #ifdef INET6
121 #include <netinet/ip6.h>
122 #include <netinet6/ip6_var.h>
123 #endif
124 #include <netinet/if_ether.h> /* for struct arpcom */
125 #include <net/bridge/if_bridgevar.h>
126 #include <net/if_llc.h>
127 
128 #include <net/route.h>
129 #include <sys/in_cksum.h>
130 
/*
 * Size of the route hash table.  Must be a power of two: the mask below
 * is derived as (size - 1), which is only a valid bit mask in that case.
 * The value may be overridden at build time, so the constraint is
 * enforced by the preprocessor rather than left to the comment.
 */
#ifndef BRIDGE_RTHASH_SIZE
#define	BRIDGE_RTHASH_SIZE		1024
#endif

#if (BRIDGE_RTHASH_SIZE) <= 0 || \
    ((BRIDGE_RTHASH_SIZE) & ((BRIDGE_RTHASH_SIZE) - 1)) != 0
#error "BRIDGE_RTHASH_SIZE must be a power of two"
#endif

#define	BRIDGE_RTHASH_MASK		(BRIDGE_RTHASH_SIZE - 1)

/*
 * Maximum number of addresses to cache.
 */
#ifndef BRIDGE_RTABLE_MAX
#define	BRIDGE_RTABLE_MAX		100
#endif

/*
 * Spanning tree defaults.
 *
 * The timer values are stored scaled by 256; the get/set ioctl handlers
 * in this file shift by 8 when converting to and from the user-visible
 * value.
 */
#define	BSTP_DEFAULT_MAX_AGE		(20 * 256)
#define	BSTP_DEFAULT_HELLO_TIME		(2 * 256)
#define	BSTP_DEFAULT_FORWARD_DELAY	(15 * 256)
#define	BSTP_DEFAULT_HOLD_TIME		(1 * 256)
#define	BSTP_DEFAULT_BRIDGE_PRIORITY	0x8000
#define	BSTP_DEFAULT_PORT_PRIORITY	0x80
#define	BSTP_DEFAULT_PATH_COST		55

/*
 * Timeout (in seconds) for entries learned dynamically.
 */
#ifndef BRIDGE_RTABLE_TIMEOUT
#define	BRIDGE_RTABLE_TIMEOUT		(20 * 60)	/* same as ARP */
#endif

/*
 * Number of seconds between walks of the route list.
 */
#ifndef BRIDGE_RTABLE_PRUNE_PERIOD
#define	BRIDGE_RTABLE_PRUNE_PERIOD	(5 * 60)
#endif
171 
172 extern	struct mbuf *(*bridge_input_p)(struct ifnet *, struct mbuf *);
173 extern	int (*bridge_output_p)(struct ifnet *, struct mbuf *,
174 		struct sockaddr *, struct rtentry *);
175 extern	void (*bridge_dn_p)(struct mbuf *, struct ifnet *);
176 extern	void (*bridge_detach_p)(struct ifnet *);
177 
178 int	bridge_rtable_prune_period = BRIDGE_RTABLE_PRUNE_PERIOD;
179 
180 int	bridge_clone_create(struct if_clone *, int);
181 void	bridge_clone_destroy(struct ifnet *);
182 
183 int	bridge_ioctl(struct ifnet *, u_long, caddr_t, struct ucred *);
184 
185 static void	bridge_init(void *);
186 void	bridge_stop(struct ifnet *, int);
187 void	bridge_start(struct ifnet *);
188 
189 void	bridge_forward(struct bridge_softc *, struct mbuf *m);
190 
191 void	bridge_timer(void *);
192 
193 void	bridge_broadcast(struct bridge_softc *, struct ifnet *, struct mbuf *,
194 	    int);
195 
196 int	bridge_rtupdate(struct bridge_softc *, const uint8_t *,
197 	    struct ifnet *, int, uint8_t);
198 struct ifnet *bridge_rtlookup(struct bridge_softc *, const uint8_t *);
199 void	bridge_rttrim(struct bridge_softc *);
200 void	bridge_rtage(struct bridge_softc *);
201 void	bridge_rtflush(struct bridge_softc *, int);
202 int	bridge_rtdaddr(struct bridge_softc *, const uint8_t *);
203 
204 int	bridge_rtable_init(struct bridge_softc *);
205 void	bridge_rtable_fini(struct bridge_softc *);
206 
207 struct bridge_rtnode *bridge_rtnode_lookup(struct bridge_softc *,
208 	    const uint8_t *);
209 int	bridge_rtnode_insert(struct bridge_softc *, struct bridge_rtnode *);
210 void	bridge_rtnode_destroy(struct bridge_softc *, struct bridge_rtnode *);
211 
212 struct bridge_iflist *bridge_lookup_member(struct bridge_softc *,
213 	    const char *name);
214 struct bridge_iflist *bridge_lookup_member_if(struct bridge_softc *,
215 	    struct ifnet *ifp);
216 void	bridge_delete_member(struct bridge_softc *, struct bridge_iflist *);
217 
218 int	bridge_ioctl_add(struct bridge_softc *, void *);
219 int	bridge_ioctl_del(struct bridge_softc *, void *);
220 int	bridge_ioctl_gifflags(struct bridge_softc *, void *);
221 int	bridge_ioctl_sifflags(struct bridge_softc *, void *);
222 int	bridge_ioctl_scache(struct bridge_softc *, void *);
223 int	bridge_ioctl_gcache(struct bridge_softc *, void *);
224 int	bridge_ioctl_gifs(struct bridge_softc *, void *);
225 int	bridge_ioctl_rts(struct bridge_softc *, void *);
226 int	bridge_ioctl_saddr(struct bridge_softc *, void *);
227 int	bridge_ioctl_sto(struct bridge_softc *, void *);
228 int	bridge_ioctl_gto(struct bridge_softc *, void *);
229 int	bridge_ioctl_daddr(struct bridge_softc *, void *);
230 int	bridge_ioctl_flush(struct bridge_softc *, void *);
231 int	bridge_ioctl_gpri(struct bridge_softc *, void *);
232 int	bridge_ioctl_spri(struct bridge_softc *, void *);
233 int	bridge_ioctl_ght(struct bridge_softc *, void *);
234 int	bridge_ioctl_sht(struct bridge_softc *, void *);
235 int	bridge_ioctl_gfd(struct bridge_softc *, void *);
236 int	bridge_ioctl_sfd(struct bridge_softc *, void *);
237 int	bridge_ioctl_gma(struct bridge_softc *, void *);
238 int	bridge_ioctl_sma(struct bridge_softc *, void *);
239 int	bridge_ioctl_sifprio(struct bridge_softc *, void *);
240 int	bridge_ioctl_sifcost(struct bridge_softc *, void *);
241 static int bridge_pfil(struct mbuf **, struct ifnet *, struct ifnet *, int);
242 static int bridge_ip_checkbasic(struct mbuf **mp);
243 # ifdef INET6
244 static int bridge_ip6_checkbasic(struct mbuf **mp);
245 # endif /* INET6 */
246 
247 SYSCTL_DECL(_net_link);
248 SYSCTL_NODE(_net_link, IFT_BRIDGE, bridge, CTLFLAG_RW, 0, "Bridge");
249 
250 static int pfil_bridge = 1; /* run pfil hooks on the bridge interface */
251 static int pfil_member = 1; /* run pfil hooks on the member interface */
252 SYSCTL_INT(_net_link_bridge, OID_AUTO, pfil_bridge, CTLFLAG_RW,
253     &pfil_bridge, 0, "Packet filter on the bridge interface");
254 SYSCTL_INT(_net_link_bridge, OID_AUTO, pfil_member, CTLFLAG_RW,
255     &pfil_member, 0, "Packet filter on the member interface");
256 
/*
 * Flags for bridge_control.bc_flags, interpreted by bridge_ioctl().
 */
#define	BC_F_COPYIN		0x01	/* copy arguments in */
#define	BC_F_COPYOUT		0x02	/* copy arguments out */
#define	BC_F_SUSER		0x04	/* do super-user check */

/*
 * One entry of the driver-specific ioctl dispatch table.
 */
struct bridge_control {
	/* handler, called with the softc and the argument buffer */
	int	(*bc_func)(struct bridge_softc *, void *);
	/* exact argument size the caller must supply */
	int	bc_argsize;
	/* BC_F_* flags */
	int	bc_flags;
};
266 
267 const struct bridge_control bridge_control_table[] = {
268 	{ bridge_ioctl_add,		sizeof(struct ifbreq),
269 	  BC_F_COPYIN|BC_F_SUSER },
270 	{ bridge_ioctl_del,		sizeof(struct ifbreq),
271 	  BC_F_COPYIN|BC_F_SUSER },
272 
273 	{ bridge_ioctl_gifflags,	sizeof(struct ifbreq),
274 	  BC_F_COPYIN|BC_F_COPYOUT },
275 	{ bridge_ioctl_sifflags,	sizeof(struct ifbreq),
276 	  BC_F_COPYIN|BC_F_SUSER },
277 
278 	{ bridge_ioctl_scache,		sizeof(struct ifbrparam),
279 	  BC_F_COPYIN|BC_F_SUSER },
280 	{ bridge_ioctl_gcache,		sizeof(struct ifbrparam),
281 	  BC_F_COPYOUT },
282 
283 	{ bridge_ioctl_gifs,		sizeof(struct ifbifconf),
284 	  BC_F_COPYIN|BC_F_COPYOUT },
285 	{ bridge_ioctl_rts,		sizeof(struct ifbaconf),
286 	  BC_F_COPYIN|BC_F_COPYOUT },
287 
288 	{ bridge_ioctl_saddr,		sizeof(struct ifbareq),
289 	  BC_F_COPYIN|BC_F_SUSER },
290 
291 	{ bridge_ioctl_sto,		sizeof(struct ifbrparam),
292 	  BC_F_COPYIN|BC_F_SUSER },
293 	{ bridge_ioctl_gto,		sizeof(struct ifbrparam),
294 	  BC_F_COPYOUT },
295 
296 	{ bridge_ioctl_daddr,		sizeof(struct ifbareq),
297 	  BC_F_COPYIN|BC_F_SUSER },
298 
299 	{ bridge_ioctl_flush,		sizeof(struct ifbreq),
300 	  BC_F_COPYIN|BC_F_SUSER },
301 
302 	{ bridge_ioctl_gpri,		sizeof(struct ifbrparam),
303 	  BC_F_COPYOUT },
304 	{ bridge_ioctl_spri,		sizeof(struct ifbrparam),
305 	  BC_F_COPYIN|BC_F_SUSER },
306 
307 	{ bridge_ioctl_ght,		sizeof(struct ifbrparam),
308 	  BC_F_COPYOUT },
309 	{ bridge_ioctl_sht,		sizeof(struct ifbrparam),
310 	  BC_F_COPYIN|BC_F_SUSER },
311 
312 	{ bridge_ioctl_gfd,		sizeof(struct ifbrparam),
313 	  BC_F_COPYOUT },
314 	{ bridge_ioctl_sfd,		sizeof(struct ifbrparam),
315 	  BC_F_COPYIN|BC_F_SUSER },
316 
317 	{ bridge_ioctl_gma,		sizeof(struct ifbrparam),
318 	  BC_F_COPYOUT },
319 	{ bridge_ioctl_sma,		sizeof(struct ifbrparam),
320 	  BC_F_COPYIN|BC_F_SUSER },
321 
322 	{ bridge_ioctl_sifprio,		sizeof(struct ifbreq),
323 	  BC_F_COPYIN|BC_F_SUSER },
324 
325 	{ bridge_ioctl_sifcost,		sizeof(struct ifbreq),
326 	  BC_F_COPYIN|BC_F_SUSER },
327 };
328 const int bridge_control_table_size =
329     sizeof(bridge_control_table) / sizeof(bridge_control_table[0]);
330 
331 static const u_char etherbroadcastaddr[ETHER_ADDR_LEN] =
332 			{ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff };
333 
334 LIST_HEAD(, bridge_softc) bridge_list;
335 
336 struct if_clone bridge_cloner = IF_CLONE_INITIALIZER("bridge",
337                                 bridge_clone_create,
338 				bridge_clone_destroy, 0, IF_MAXUNIT);
339 
340 static int
341 bridge_modevent(module_t mod, int type, void *data)
342 {
343 
344 	switch (type) {
345 	case MOD_LOAD:
346 		LIST_INIT(&bridge_list);
347 		if_clone_attach(&bridge_cloner);
348 		bridge_input_p = bridge_input;
349 		bridge_output_p = bridge_output_serialized;
350 #if notyet
351 		bridge_detach_p = bridge_ifdetach;
352 		bstp_linkstate_p = bstp_linkstate;
353 #endif
354 		break;
355 	case MOD_UNLOAD:
356 		if (!LIST_EMPTY(&bridge_list))
357 			return EBUSY;
358 		if_clone_detach(&bridge_cloner);
359 		bridge_input_p = NULL;
360 		bridge_output_p = NULL;
361 #if notyet
362 		bridge_detach_p = NULL;
363 		bstp_linkstate_p = NULL;
364 #endif
365 		break;
366 	default:
367 		return EOPNOTSUPP;
368 	}
369 	return 0;
370 }
371 
372 static moduledata_t bridge_mod = {
373 	"if_bridge",
374 	bridge_modevent,
375 	0
376 };
377 
378 DECLARE_MODULE(if_bridge, bridge_mod, SI_SUB_PSEUDO, SI_ORDER_ANY);
379 
380 
381 /*
382  * bridge_clone_create:
383  *
384  *	Create a new bridge instance.
385  */
386 int
387 bridge_clone_create(struct if_clone *ifc, int unit)
388 {
389 	struct bridge_softc *sc;
390 	struct ifnet *ifp;
391 	u_char eaddr[6];
392 
393 	sc = malloc(sizeof(*sc), M_DEVBUF, M_WAITOK|M_ZERO);
394 	ifp = sc->sc_ifp = &sc->sc_if;
395 
396 	sc->sc_brtmax = BRIDGE_RTABLE_MAX;
397 	sc->sc_brttimeout = BRIDGE_RTABLE_TIMEOUT;
398 	sc->sc_bridge_max_age = BSTP_DEFAULT_MAX_AGE;
399 	sc->sc_bridge_hello_time = BSTP_DEFAULT_HELLO_TIME;
400 	sc->sc_bridge_forward_delay = BSTP_DEFAULT_FORWARD_DELAY;
401 	sc->sc_bridge_priority = BSTP_DEFAULT_BRIDGE_PRIORITY;
402 	sc->sc_hold_time = BSTP_DEFAULT_HOLD_TIME;
403 
404 	/* Initialize our routing table. */
405 	bridge_rtable_init(sc);
406 
407 	callout_init(&sc->sc_brcallout);
408 	callout_init(&sc->sc_bstpcallout);
409 
410 	LIST_INIT(&sc->sc_iflist);
411 
412 	ifp->if_softc = sc;
413 	if_initname(ifp, ifc->ifc_name, unit);
414 	ifp->if_mtu = ETHERMTU;
415 	ifp->if_flags = IFF_MULTICAST;
416 	ifp->if_ioctl = bridge_ioctl;
417 	ifp->if_start = bridge_start;
418 	ifp->if_init = bridge_init;
419 	ifp->if_type = IFT_BRIDGE;
420 	ifq_set_maxlen(&ifp->if_snd, ifqmaxlen);
421 	ifp->if_snd.ifq_maxlen = ifqmaxlen;
422 	ifq_set_ready(&ifp->if_snd);
423 	ifp->if_hdrlen = ETHER_HDR_LEN;
424 
425 	/*
426 	 * Generate a random ethernet address and use the private AC:DE:48
427 	 * OUI code.
428 	 */
429 	{
430 		int rnd = arc4random();
431 		bcopy(&rnd, &eaddr[2], 4); /* ETHER_ADDR_LEN == 6 */
432 	}
433 	eaddr[0] = 0xAC;
434 	eaddr[1] = 0xDE;
435 	eaddr[2] = 0x48;
436 
437 	ether_ifattach(ifp, eaddr, NULL);
438 	/* Now undo some of the damage... */
439 	ifp->if_baudrate = 0;
440 	ifp->if_type = IFT_BRIDGE;
441 
442 	crit_enter();
443 	LIST_INSERT_HEAD(&bridge_list, sc, sc_list);
444 	crit_exit();
445 
446 	return (0);
447 }
448 
449 /*
450  * bridge_clone_destroy:
451  *
452  *	Destroy a bridge instance.
453  */
454 void
455 bridge_clone_destroy(struct ifnet *ifp)
456 {
457 	struct bridge_softc *sc = ifp->if_softc;
458 	struct bridge_iflist *bif;
459 
460 	lwkt_serialize_enter(ifp->if_serializer);
461 
462 	bridge_stop(ifp, 1);
463 	ifp->if_flags &= ~IFF_UP;
464 
465 	while ((bif = LIST_FIRST(&sc->sc_iflist)) != NULL)
466 		bridge_delete_member(sc, bif);
467 
468 	callout_stop(&sc->sc_brcallout);
469 	callout_stop(&sc->sc_bstpcallout);
470 
471 	lwkt_serialize_exit(ifp->if_serializer);
472 
473 	crit_enter();
474 	LIST_REMOVE(sc, sc_list);
475 	crit_exit();
476 
477 	ether_ifdetach(ifp);
478 
479 
480 	/* Tear down the routing table. */
481 	bridge_rtable_fini(sc);
482 
483 	free(sc, M_DEVBUF);
484 }
485 
486 /*
487  * bridge_ioctl:
488  *
489  *	Handle a control request from the operator.
490  */
491 int
492 bridge_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data, struct ucred *cr)
493 {
494 	struct bridge_softc *sc = ifp->if_softc;
495 	struct thread *td = curthread;
496 	union {
497 		struct ifbreq ifbreq;
498 		struct ifbifconf ifbifconf;
499 		struct ifbareq ifbareq;
500 		struct ifbaconf ifbaconf;
501 		struct ifbrparam ifbrparam;
502 	} args;
503 	struct ifdrv *ifd = (struct ifdrv *) data;
504 	const struct bridge_control *bc;
505 	int error = 0;
506 
507 	switch (cmd) {
508 
509 	case SIOCADDMULTI:
510 	case SIOCDELMULTI:
511 		break;
512 
513 	case SIOCGDRVSPEC:
514 	case SIOCSDRVSPEC:
515 		if (ifd->ifd_cmd >= bridge_control_table_size) {
516 			error = EINVAL;
517 			break;
518 		}
519 		bc = &bridge_control_table[ifd->ifd_cmd];
520 
521 		if (cmd == SIOCGDRVSPEC &&
522 		    (bc->bc_flags & BC_F_COPYOUT) == 0) {
523 			error = EINVAL;
524 			break;
525 		}
526 		else if (cmd == SIOCSDRVSPEC &&
527 		    (bc->bc_flags & BC_F_COPYOUT) != 0) {
528 			error = EINVAL;
529 			break;
530 		}
531 
532 		if (bc->bc_flags & BC_F_SUSER) {
533 			error = suser(td);
534 			if (error)
535 				break;
536 		}
537 
538 		if (ifd->ifd_len != bc->bc_argsize ||
539 		    ifd->ifd_len > sizeof(args)) {
540 			error = EINVAL;
541 			break;
542 		}
543 
544 		if (bc->bc_flags & BC_F_COPYIN) {
545 			error = copyin(ifd->ifd_data, &args, ifd->ifd_len);
546 			if (error)
547 				break;
548 		}
549 
550 		error = (*bc->bc_func)(sc, &args);
551 		if (error)
552 			break;
553 
554 		if (bc->bc_flags & BC_F_COPYOUT)
555 			error = copyout(&args, ifd->ifd_data, ifd->ifd_len);
556 
557 		break;
558 
559 	case SIOCSIFFLAGS:
560 		if (!(ifp->if_flags & IFF_UP) &&
561 		    (ifp->if_flags & IFF_RUNNING)) {
562 			/*
563 			 * If interface is marked down and it is running,
564 			 * then stop and disable it.
565 			 */
566 			bridge_stop(ifp, 1);
567 		} else if ((ifp->if_flags & IFF_UP) &&
568 		    !(ifp->if_flags & IFF_RUNNING)) {
569 			/*
570 			 * If interface is marked up and it is stopped, then
571 			 * start it.
572 			 */
573 			(*ifp->if_init)(sc);
574 		}
575 		break;
576 
577 	case SIOCSIFMTU:
578 		/* Do not allow the MTU to be changed on the bridge */
579 		error = EINVAL;
580 		break;
581 
582 	default:
583 		/*
584 		 * drop the lock as ether_ioctl() will call bridge_start() and
585 		 * cause the lock to be recursed.
586 		 */
587 		error = ether_ioctl(ifp, cmd, data);
588 		break;
589 	}
590 
591 	return (error);
592 }
593 
594 /*
595  * bridge_lookup_member:
596  *
597  *	Lookup a bridge member interface.
598  */
599 struct bridge_iflist *
600 bridge_lookup_member(struct bridge_softc *sc, const char *name)
601 {
602 	struct bridge_iflist *bif;
603 	struct ifnet *ifp;
604 
605 	LIST_FOREACH(bif, &sc->sc_iflist, bif_next) {
606 		ifp = bif->bif_ifp;
607 		if (strcmp(ifp->if_xname, name) == 0)
608 			return (bif);
609 	}
610 
611 	return (NULL);
612 }
613 
614 /*
615  * bridge_lookup_member_if:
616  *
617  *	Lookup a bridge member interface by ifnet*.
618  */
619 struct bridge_iflist *
620 bridge_lookup_member_if(struct bridge_softc *sc, struct ifnet *member_ifp)
621 {
622 	struct bridge_iflist *bif;
623 
624 	LIST_FOREACH(bif, &sc->sc_iflist, bif_next) {
625 		if (bif->bif_ifp == member_ifp)
626 			return (bif);
627 	}
628 
629 	return (NULL);
630 }
631 
632 /*
633  * bridge_delete_member:
634  *
635  *	Delete the specified member interface.
636  */
637 void
638 bridge_delete_member(struct bridge_softc *sc, struct bridge_iflist *bif)
639 {
640 	struct ifnet *ifs = bif->bif_ifp;
641 
642 	switch (ifs->if_type) {
643 	case IFT_ETHER:
644 	case IFT_L2VLAN:
645 		/*
646 		 * Take the interface out of promiscuous mode.
647 		 */
648 		ifpromisc(ifs, 0);
649 		break;
650 
651 	case IFT_GIF:
652 		break;
653 
654 	default:
655 #ifdef DIAGNOSTIC
656 		panic("bridge_delete_member: impossible");
657 #endif
658 		break;
659 	}
660 
661 	ifs->if_bridge = NULL;
662 
663 	LIST_REMOVE(bif, bif_next);
664 
665 	bridge_rtdelete(sc, ifs, IFBF_FLUSHALL);
666 
667 	free(bif, M_DEVBUF);
668 
669 	if (sc->sc_ifp->if_flags & IFF_RUNNING)
670 		bstp_initialization(sc);
671 }
672 
673 int
674 bridge_ioctl_add(struct bridge_softc *sc, void *arg)
675 {
676 	struct ifbreq *req = arg;
677 	struct bridge_iflist *bif = NULL;
678 	struct ifnet *ifs;
679 	int error = 0;
680 
681 	ifs = ifunit(req->ifbr_ifsname);
682 	if (ifs == NULL)
683 		return (ENOENT);
684 
685 	/* Allow the first member to define the MTU */
686 	if (LIST_EMPTY(&sc->sc_iflist))
687 		sc->sc_ifp->if_mtu = ifs->if_mtu;
688 	else if (sc->sc_ifp->if_mtu != ifs->if_mtu) {
689 		if_printf(sc->sc_ifp, "invalid MTU for %s\n", ifs->if_xname);
690 		return (EINVAL);
691 	}
692 
693 	if (ifs->if_bridge == sc)
694 		return (EEXIST);
695 
696 	if (ifs->if_bridge != NULL)
697 		return (EBUSY);
698 
699 	bif = malloc(sizeof(*bif), M_DEVBUF, M_NOWAIT);
700 	if (bif == NULL)
701 		return (ENOMEM);
702 
703 	switch (ifs->if_type) {
704 	case IFT_ETHER:
705 	case IFT_L2VLAN:
706 		/*
707 		 * Place the interface into promiscuous mode.
708 		 */
709 		error = ifpromisc(ifs, 1);
710 		if (error)
711 			goto out;
712 		break;
713 
714 	case IFT_GIF: /* :^) */
715 		break;
716 
717 	default:
718 		error = EINVAL;
719 		goto out;
720 	}
721 
722 	bif->bif_ifp = ifs;
723 	bif->bif_flags = IFBIF_LEARNING | IFBIF_DISCOVER;
724 	bif->bif_priority = BSTP_DEFAULT_PORT_PRIORITY;
725 	bif->bif_path_cost = BSTP_DEFAULT_PATH_COST;
726 
727 	ifs->if_bridge = sc;
728 
729 	LIST_INSERT_HEAD(&sc->sc_iflist, bif, bif_next);
730 
731 	if (sc->sc_ifp->if_flags & IFF_RUNNING)
732 		bstp_initialization(sc);
733 	else
734 		bstp_stop(sc);
735 
736  out:
737 	if (error) {
738 		if (bif != NULL)
739 			free(bif, M_DEVBUF);
740 	}
741 	return (error);
742 }
743 
744 int
745 bridge_ioctl_del(struct bridge_softc *sc, void *arg)
746 {
747 	struct ifbreq *req = arg;
748 	struct bridge_iflist *bif;
749 
750 	bif = bridge_lookup_member(sc, req->ifbr_ifsname);
751 	if (bif == NULL)
752 		return (ENOENT);
753 
754 	bridge_delete_member(sc, bif);
755 
756 	return (0);
757 }
758 
759 int
760 bridge_ioctl_gifflags(struct bridge_softc *sc, void *arg)
761 {
762 	struct ifbreq *req = arg;
763 	struct bridge_iflist *bif;
764 
765 	bif = bridge_lookup_member(sc, req->ifbr_ifsname);
766 	if (bif == NULL)
767 		return (ENOENT);
768 
769 	req->ifbr_ifsflags = bif->bif_flags;
770 	req->ifbr_state = bif->bif_state;
771 	req->ifbr_priority = bif->bif_priority;
772 	req->ifbr_path_cost = bif->bif_path_cost;
773 	req->ifbr_portno = bif->bif_ifp->if_index & 0xff;
774 
775 	return (0);
776 }
777 
778 int
779 bridge_ioctl_sifflags(struct bridge_softc *sc, void *arg)
780 {
781 	struct ifbreq *req = arg;
782 	struct bridge_iflist *bif;
783 
784 	bif = bridge_lookup_member(sc, req->ifbr_ifsname);
785 	if (bif == NULL)
786 		return (ENOENT);
787 
788 	if (req->ifbr_ifsflags & IFBIF_STP) {
789 		switch (bif->bif_ifp->if_type) {
790 		case IFT_ETHER:
791 			/* These can do spanning tree. */
792 			break;
793 
794 		default:
795 			/* Nothing else can. */
796 			return (EINVAL);
797 		}
798 	}
799 
800 	bif->bif_flags = req->ifbr_ifsflags;
801 
802 	if (sc->sc_ifp->if_flags & IFF_RUNNING)
803 		bstp_initialization(sc);
804 
805 	return (0);
806 }
807 
808 int
809 bridge_ioctl_scache(struct bridge_softc *sc, void *arg)
810 {
811 	struct ifbrparam *param = arg;
812 
813 	sc->sc_brtmax = param->ifbrp_csize;
814 	bridge_rttrim(sc);
815 
816 	return (0);
817 }
818 
819 int
820 bridge_ioctl_gcache(struct bridge_softc *sc, void *arg)
821 {
822 	struct ifbrparam *param = arg;
823 
824 	param->ifbrp_csize = sc->sc_brtmax;
825 
826 	return (0);
827 }
828 
829 int
830 bridge_ioctl_gifs(struct bridge_softc *sc, void *arg)
831 {
832 	struct ifbifconf *bifc = arg;
833 	struct bridge_iflist *bif;
834 	struct ifbreq breq;
835 	int count, len, error = 0;
836 
837 	count = 0;
838 	LIST_FOREACH(bif, &sc->sc_iflist, bif_next)
839 		count++;
840 
841 	if (bifc->ifbic_len == 0) {
842 		bifc->ifbic_len = sizeof(breq) * count;
843 		return (0);
844 	}
845 
846 	count = 0;
847 	len = bifc->ifbic_len;
848 	LIST_FOREACH(bif, &sc->sc_iflist, bif_next) {
849 		if (len < sizeof(breq))
850 			break;
851 
852 		strlcpy(breq.ifbr_ifsname, bif->bif_ifp->if_xname,
853 		    sizeof(breq.ifbr_ifsname));
854 		breq.ifbr_ifsflags = bif->bif_flags;
855 		breq.ifbr_state = bif->bif_state;
856 		breq.ifbr_priority = bif->bif_priority;
857 		breq.ifbr_path_cost = bif->bif_path_cost;
858 		breq.ifbr_portno = bif->bif_ifp->if_index & 0xff;
859 		error = copyout(&breq, bifc->ifbic_req + count, sizeof(breq));
860 		if (error)
861 			break;
862 		count++;
863 		len -= sizeof(breq);
864 	}
865 
866 	bifc->ifbic_len = sizeof(breq) * count;
867 	return (error);
868 }
869 
870 int
871 bridge_ioctl_rts(struct bridge_softc *sc, void *arg)
872 {
873 	struct ifbaconf *bac = arg;
874 	struct bridge_rtnode *brt;
875 	struct ifbareq bareq;
876 	int count = 0, error = 0, len;
877 
878 	if (bac->ifbac_len == 0)
879 		return (0);
880 
881 	len = bac->ifbac_len;
882 	LIST_FOREACH(brt, &sc->sc_rtlist, brt_list) {
883 		if (len < sizeof(bareq))
884 			goto out;
885 		strlcpy(bareq.ifba_ifsname, brt->brt_ifp->if_xname,
886 		    sizeof(bareq.ifba_ifsname));
887 		memcpy(bareq.ifba_dst, brt->brt_addr, sizeof(brt->brt_addr));
888 		if ((brt->brt_flags & IFBAF_TYPEMASK) == IFBAF_DYNAMIC &&
889 				time_second < brt->brt_expire)
890 			bareq.ifba_expire = brt->brt_expire - time_second;
891 		else
892 			bareq.ifba_expire = 0;
893 		bareq.ifba_flags = brt->brt_flags;
894 
895 		error = copyout(&bareq, bac->ifbac_req + count, sizeof(bareq));
896 		if (error)
897 			goto out;
898 		count++;
899 		len -= sizeof(bareq);
900 	}
901  out:
902 	bac->ifbac_len = sizeof(bareq) * count;
903 	return (error);
904 }
905 
906 int
907 bridge_ioctl_saddr(struct bridge_softc *sc, void *arg)
908 {
909 	struct ifbareq *req = arg;
910 	struct bridge_iflist *bif;
911 	int error;
912 
913 	bif = bridge_lookup_member(sc, req->ifba_ifsname);
914 	if (bif == NULL)
915 		return (ENOENT);
916 
917 	error = bridge_rtupdate(sc, req->ifba_dst, bif->bif_ifp, 1,
918 	    req->ifba_flags);
919 
920 	return (error);
921 }
922 
923 int
924 bridge_ioctl_sto(struct bridge_softc *sc, void *arg)
925 {
926 	struct ifbrparam *param = arg;
927 
928 	sc->sc_brttimeout = param->ifbrp_ctime;
929 
930 	return (0);
931 }
932 
933 int
934 bridge_ioctl_gto(struct bridge_softc *sc, void *arg)
935 {
936 	struct ifbrparam *param = arg;
937 
938 	param->ifbrp_ctime = sc->sc_brttimeout;
939 
940 	return (0);
941 }
942 
943 int
944 bridge_ioctl_daddr(struct bridge_softc *sc, void *arg)
945 {
946 	struct ifbareq *req = arg;
947 
948 	return (bridge_rtdaddr(sc, req->ifba_dst));
949 }
950 
951 int
952 bridge_ioctl_flush(struct bridge_softc *sc, void *arg)
953 {
954 	struct ifbreq *req = arg;
955 
956 	bridge_rtflush(sc, req->ifbr_ifsflags);
957 
958 	return (0);
959 }
960 
961 int
962 bridge_ioctl_gpri(struct bridge_softc *sc, void *arg)
963 {
964 	struct ifbrparam *param = arg;
965 
966 	param->ifbrp_prio = sc->sc_bridge_priority;
967 
968 	return (0);
969 }
970 
971 int
972 bridge_ioctl_spri(struct bridge_softc *sc, void *arg)
973 {
974 	struct ifbrparam *param = arg;
975 
976 	sc->sc_bridge_priority = param->ifbrp_prio;
977 
978 	if (sc->sc_ifp->if_flags & IFF_RUNNING)
979 		bstp_initialization(sc);
980 
981 	return (0);
982 }
983 
984 int
985 bridge_ioctl_ght(struct bridge_softc *sc, void *arg)
986 {
987 	struct ifbrparam *param = arg;
988 
989 	param->ifbrp_hellotime = sc->sc_bridge_hello_time >> 8;
990 
991 	return (0);
992 }
993 
994 int
995 bridge_ioctl_sht(struct bridge_softc *sc, void *arg)
996 {
997 	struct ifbrparam *param = arg;
998 
999 	if (param->ifbrp_hellotime == 0)
1000 		return (EINVAL);
1001 	sc->sc_bridge_hello_time = param->ifbrp_hellotime << 8;
1002 
1003 	if (sc->sc_ifp->if_flags & IFF_RUNNING)
1004 		bstp_initialization(sc);
1005 
1006 	return (0);
1007 }
1008 
1009 int
1010 bridge_ioctl_gfd(struct bridge_softc *sc, void *arg)
1011 {
1012 	struct ifbrparam *param = arg;
1013 
1014 	param->ifbrp_fwddelay = sc->sc_bridge_forward_delay >> 8;
1015 
1016 	return (0);
1017 }
1018 
1019 int
1020 bridge_ioctl_sfd(struct bridge_softc *sc, void *arg)
1021 {
1022 	struct ifbrparam *param = arg;
1023 
1024 	if (param->ifbrp_fwddelay == 0)
1025 		return (EINVAL);
1026 	sc->sc_bridge_forward_delay = param->ifbrp_fwddelay << 8;
1027 
1028 	if (sc->sc_ifp->if_flags & IFF_RUNNING)
1029 		bstp_initialization(sc);
1030 
1031 	return (0);
1032 }
1033 
1034 int
1035 bridge_ioctl_gma(struct bridge_softc *sc, void *arg)
1036 {
1037 	struct ifbrparam *param = arg;
1038 
1039 	param->ifbrp_maxage = sc->sc_bridge_max_age >> 8;
1040 
1041 	return (0);
1042 }
1043 
1044 int
1045 bridge_ioctl_sma(struct bridge_softc *sc, void *arg)
1046 {
1047 	struct ifbrparam *param = arg;
1048 
1049 	if (param->ifbrp_maxage == 0)
1050 		return (EINVAL);
1051 	sc->sc_bridge_max_age = param->ifbrp_maxage << 8;
1052 
1053 	if (sc->sc_ifp->if_flags & IFF_RUNNING)
1054 		bstp_initialization(sc);
1055 
1056 	return (0);
1057 }
1058 
1059 int
1060 bridge_ioctl_sifprio(struct bridge_softc *sc, void *arg)
1061 {
1062 	struct ifbreq *req = arg;
1063 	struct bridge_iflist *bif;
1064 
1065 	bif = bridge_lookup_member(sc, req->ifbr_ifsname);
1066 	if (bif == NULL)
1067 		return (ENOENT);
1068 
1069 	bif->bif_priority = req->ifbr_priority;
1070 
1071 	if (sc->sc_ifp->if_flags & IFF_RUNNING)
1072 		bstp_initialization(sc);
1073 
1074 	return (0);
1075 }
1076 
1077 int
1078 bridge_ioctl_sifcost(struct bridge_softc *sc, void *arg)
1079 {
1080 	struct ifbreq *req = arg;
1081 	struct bridge_iflist *bif;
1082 
1083 	bif = bridge_lookup_member(sc, req->ifbr_ifsname);
1084 	if (bif == NULL)
1085 		return (ENOENT);
1086 
1087 	bif->bif_path_cost = req->ifbr_path_cost;
1088 
1089 	if (sc->sc_ifp->if_flags & IFF_RUNNING)
1090 		bstp_initialization(sc);
1091 
1092 	return (0);
1093 }
1094 
1095 /*
1096  * bridge_ifdetach:
1097  *
1098  *	Detach an interface from a bridge.  Called when a member
1099  *	interface is detaching.
1100  */
1101 void
1102 bridge_ifdetach(struct ifnet *ifp)
1103 {
1104 	struct bridge_softc *sc = ifp->if_bridge;
1105 	struct ifbreq breq;
1106 
1107 	memset(&breq, 0, sizeof(breq));
1108 	snprintf(breq.ifbr_ifsname, sizeof(breq.ifbr_ifsname), ifp->if_xname);
1109 
1110 	lwkt_serialize_enter(ifp->if_serializer);
1111 	bridge_ioctl_del(sc, &breq);
1112 	lwkt_serialize_exit(ifp->if_serializer);
1113 }
1114 
1115 /*
1116  * bridge_init:
1117  *
1118  *	Initialize a bridge interface.
1119  */
1120 static void
1121 bridge_init(void *xsc)
1122 {
1123 	struct bridge_softc *sc = (struct bridge_softc *)xsc;
1124 	struct ifnet *ifp = sc->sc_ifp;
1125 
1126 	if (ifp->if_flags & IFF_RUNNING)
1127 		return;
1128 
1129 	callout_reset(&sc->sc_brcallout, bridge_rtable_prune_period * hz,
1130 	    bridge_timer, sc);
1131 
1132 	ifp->if_flags |= IFF_RUNNING;
1133 	bstp_initialization(sc);
1134 	return;
1135 }
1136 
1137 /*
1138  * bridge_stop:
1139  *
1140  *	Stop the bridge interface.
1141  */
1142 void
1143 bridge_stop(struct ifnet *ifp, int disable)
1144 {
1145 	struct bridge_softc *sc = ifp->if_softc;
1146 
1147 	ASSERT_SERIALIZED(ifp->if_serializer);
1148 
1149 	if ((ifp->if_flags & IFF_RUNNING) == 0)
1150 		return;
1151 
1152 	callout_stop(&sc->sc_brcallout);
1153 	bstp_stop(sc);
1154 
1155 	bridge_rtflush(sc, IFBF_FLUSHDYN);
1156 
1157 	ifp->if_flags &= ~IFF_RUNNING;
1158 }
1159 
1160 /*
1161  * bridge_enqueue:
1162  *
1163  *	Enqueue a packet on a bridge member interface.
1164  *
1165  */
1166 __inline void
1167 bridge_enqueue(struct bridge_softc *sc, struct ifnet *dst_ifp, struct mbuf *m)
1168 {
1169 	struct altq_pktattr pktattr;
1170 
1171 	/*
1172 	 * Clear any in-bound checksum flags for this packet.
1173 	 *
1174 	 * XXX this seems to mess up the output packet.
1175 	 */
1176 /*	m->m_pkthdr.csum_flags = 0;*/
1177 
1178 	while (m->m_type == MT_TAG) {
1179 		/* XXX see ether_output_frame for full rules check */
1180 		m = m->m_next;
1181 	}
1182 
1183 	lwkt_serialize_enter(dst_ifp->if_serializer);
1184 
1185 	if (ifq_is_enabled(&dst_ifp->if_snd))
1186 		altq_etherclassify(&dst_ifp->if_snd, m, &pktattr);
1187 
1188 	ifq_handoff(dst_ifp, m, &pktattr);
1189 
1190 	lwkt_serialize_exit(dst_ifp->if_serializer);
1191 }
1192 
1193 /*
1194  * bridge_output_serialized:
1195  *
1196  *	Send output from a bridge member interface.  This
1197  *	performs the bridging function for locally originated
1198  *	packets.
1199  *
1200  *	The mbuf has the Ethernet header already attached.  We must
1201  *	enqueue or free the mbuf before returning.
1202  */
1203 int
1204 bridge_output_serialized(struct ifnet *ifp, struct mbuf *m,
1205     struct sockaddr *sa, struct rtentry *rt)
1206 {
1207 	struct ether_header *eh;
1208 	struct ifnet *dst_if;
1209 	struct bridge_softc *sc;
1210 
1211 	sc = ifp->if_bridge;
1212 
1213 	ASSERT_SERIALIZED(ifp->if_serializer);
1214 
1215 	if (m->m_len < ETHER_HDR_LEN) {
1216 		m = m_pullup(m, ETHER_HDR_LEN);
1217 		if (m == NULL)
1218 			return (0);
1219 	}
1220 
1221 	/*
1222 	 * Serialize our bridge interface.  We have to get rid of the
1223 	 * originating interface lock to avoid a deadlock.
1224 	 */
1225 	lwkt_serialize_exit(ifp->if_serializer);
1226 	lwkt_serialize_enter(sc->sc_ifp->if_serializer);
1227 
1228 	eh = mtod(m, struct ether_header *);
1229 
1230 	/*
1231 	 * If bridge is down, but the original output interface is up,
1232 	 * go ahead and send out that interface.  Otherwise, the packet
1233 	 * is dropped below.
1234 	 */
1235 	if ((sc->sc_ifp->if_flags & IFF_RUNNING) == 0) {
1236 		dst_if = ifp;
1237 		goto sendunicast;
1238 	}
1239 
1240 	/*
1241 	 * If the packet is a multicast, or we don't know a better way to
1242 	 * get there, send to all interfaces.
1243 	 */
1244 	if (ETHER_IS_MULTICAST(eh->ether_dhost))
1245 		dst_if = NULL;
1246 	else
1247 		dst_if = bridge_rtlookup(sc, eh->ether_dhost);
1248 	if (dst_if == NULL) {
1249 		struct bridge_iflist *bif;
1250 		struct mbuf *mc;
1251 		int used = 0;
1252 
1253 		LIST_FOREACH(bif, &sc->sc_iflist, bif_next) {
1254 			dst_if = bif->bif_ifp;
1255 			if ((dst_if->if_flags & IFF_RUNNING) == 0)
1256 				continue;
1257 
1258 			/*
1259 			 * If this is not the original output interface,
1260 			 * and the interface is participating in spanning
1261 			 * tree, make sure the port is in a state that
1262 			 * allows forwarding.
1263 			 */
1264 			if (dst_if != ifp &&
1265 			    (bif->bif_flags & IFBIF_STP) != 0) {
1266 				switch (bif->bif_state) {
1267 				case BSTP_IFSTATE_BLOCKING:
1268 				case BSTP_IFSTATE_LISTENING:
1269 				case BSTP_IFSTATE_DISABLED:
1270 					continue;
1271 				}
1272 			}
1273 
1274 			if (LIST_NEXT(bif, bif_next) == NULL) {
1275 				used = 1;
1276 				mc = m;
1277 			} else {
1278 				mc = m_copypacket(m, MB_DONTWAIT);
1279 				if (mc == NULL) {
1280 					sc->sc_ifp->if_oerrors++;
1281 					continue;
1282 				}
1283 			}
1284 			lwkt_serialize_exit(sc->sc_ifp->if_serializer);
1285 			bridge_enqueue(sc, dst_if, mc);
1286 			lwkt_serialize_enter(sc->sc_ifp->if_serializer);
1287 		}
1288 		if (used == 0)
1289 			m_freem(m);
1290 		lwkt_serialize_exit(sc->sc_ifp->if_serializer);
1291 		goto done;
1292 	}
1293 
1294  sendunicast:
1295 	/*
1296 	 * XXX Spanning tree consideration here?
1297 	 */
1298 
1299 	lwkt_serialize_exit(sc->sc_ifp->if_serializer);
1300 	if ((dst_if->if_flags & IFF_RUNNING) == 0) {
1301 		m_freem(m);
1302 	} else {
1303 		bridge_enqueue(sc, dst_if, m);
1304 	}
1305 done:
1306 	lwkt_serialize_enter(ifp->if_serializer);
1307 	return (0);
1308 }
1309 
1310 /*
1311  * bridge_start:
1312  *
1313  *	Start output on a bridge.
1314  *
1315  */
1316 void
1317 bridge_start(struct ifnet *ifp)
1318 {
1319 	struct bridge_softc *sc;
1320 	struct mbuf *m;
1321 	struct ether_header *eh;
1322 	struct ifnet *dst_if;
1323 
1324 	sc = ifp->if_softc;
1325 
1326 	ifp->if_flags |= IFF_OACTIVE;
1327 	for (;;) {
1328 		m = ifq_dequeue(&ifp->if_snd, NULL);
1329 		if (m == 0)
1330 			break;
1331 		BPF_MTAP(ifp, m);
1332 		ifp->if_opackets++;
1333 
1334 		eh = mtod(m, struct ether_header *);
1335 		dst_if = NULL;
1336 
1337 		if ((m->m_flags & (M_BCAST|M_MCAST)) == 0) {
1338 			dst_if = bridge_rtlookup(sc, eh->ether_dhost);
1339 		}
1340 
1341 		if (dst_if == NULL)
1342 			bridge_broadcast(sc, ifp, m, 0);
1343 		else
1344 			bridge_enqueue(sc, dst_if, m);
1345 	}
1346 	ifp->if_flags &= ~IFF_OACTIVE;
1347 
1348 	return;
1349 }
1350 
1351 /*
1352  * bridge_forward:
1353  *
1354  *	The forwarding function of the bridge.
1355  */
1356 void
1357 bridge_forward(struct bridge_softc *sc, struct mbuf *m)
1358 {
1359 	struct bridge_iflist *bif;
1360 	struct ifnet *src_if, *dst_if, *ifp;
1361 	struct ether_header *eh;
1362 
1363 	src_if = m->m_pkthdr.rcvif;
1364 	ifp = sc->sc_ifp;
1365 
1366 	ASSERT_SERIALIZED(ifp->if_serializer);
1367 
1368 	sc->sc_ifp->if_ipackets++;
1369 	sc->sc_ifp->if_ibytes += m->m_pkthdr.len;
1370 
1371 	/*
1372 	 * Look up the bridge_iflist.
1373 	 */
1374 	bif = bridge_lookup_member_if(sc, src_if);
1375 	if (bif == NULL) {
1376 		/* Interface is not a bridge member (anymore?) */
1377 		m_freem(m);
1378 		return;
1379 	}
1380 
1381 	if (bif->bif_flags & IFBIF_STP) {
1382 		switch (bif->bif_state) {
1383 		case BSTP_IFSTATE_BLOCKING:
1384 		case BSTP_IFSTATE_LISTENING:
1385 		case BSTP_IFSTATE_DISABLED:
1386 			m_freem(m);
1387 			return;
1388 		}
1389 	}
1390 
1391 	eh = mtod(m, struct ether_header *);
1392 
1393 	/*
1394 	 * Various ifp's are used below, release the serializer for
1395 	 * the bridge ifp so other ifp serializers can be acquired.
1396 	 */
1397 	lwkt_serialize_exit(ifp->if_serializer);
1398 
1399 	/*
1400 	 * If the interface is learning, and the source
1401 	 * address is valid and not multicast, record
1402 	 * the address.
1403 	 */
1404 	if ((bif->bif_flags & IFBIF_LEARNING) != 0 &&
1405 	    ETHER_IS_MULTICAST(eh->ether_shost) == 0 &&
1406 	    (eh->ether_shost[0] == 0 &&
1407 	     eh->ether_shost[1] == 0 &&
1408 	     eh->ether_shost[2] == 0 &&
1409 	     eh->ether_shost[3] == 0 &&
1410 	     eh->ether_shost[4] == 0 &&
1411 	     eh->ether_shost[5] == 0) == 0) {
1412 		bridge_rtupdate(sc, eh->ether_shost, src_if, 0, IFBAF_DYNAMIC);
1413 	}
1414 
1415 	if ((bif->bif_flags & IFBIF_STP) != 0 &&
1416 	    bif->bif_state == BSTP_IFSTATE_LEARNING) {
1417 		m_freem(m);
1418 		goto done;
1419 	}
1420 
1421 	/*
1422 	 * At this point, the port either doesn't participate
1423 	 * in spanning tree or it is in the forwarding state.
1424 	 */
1425 
1426 	/*
1427 	 * If the packet is unicast, destined for someone on
1428 	 * "this" side of the bridge, drop it.
1429 	 */
1430 	if ((m->m_flags & (M_BCAST|M_MCAST)) == 0) {
1431 		dst_if = bridge_rtlookup(sc, eh->ether_dhost);
1432 		if (src_if == dst_if) {
1433 			m_freem(m);
1434 			goto done;
1435 		}
1436 	} else {
1437 		/* ...forward it to all interfaces. */
1438 		sc->sc_ifp->if_imcasts++;
1439 		dst_if = NULL;
1440 	}
1441 
1442 	/* run the packet filter */
1443 	if (inet_pfil_hook.ph_hashooks > 0
1444 #ifdef INET6
1445 	    || inet6_pfil_hook.ph_hashooks > 0
1446 #endif
1447 	    ) {
1448 		if (bridge_pfil(&m, ifp, src_if, PFIL_IN) != 0)
1449 			goto done;
1450 		if (m == NULL)
1451 			goto done;
1452 	}
1453 
1454 	if (dst_if == NULL) {
1455 		bridge_broadcast(sc, src_if, m, 1);
1456 		goto done;
1457 	}
1458 
1459 	/*
1460 	 * At this point, we're dealing with a unicast frame
1461 	 * going to a different interface.
1462 	 */
1463 	if ((dst_if->if_flags & IFF_RUNNING) == 0) {
1464 		m_freem(m);
1465 		goto done;
1466 	}
1467 	bif = bridge_lookup_member_if(sc, dst_if);
1468 	if (bif == NULL) {
1469 		/* Not a member of the bridge (anymore?) */
1470 		m_freem(m);
1471 		goto done;
1472 	}
1473 
1474 	if (bif->bif_flags & IFBIF_STP) {
1475 		switch (bif->bif_state) {
1476 		case BSTP_IFSTATE_DISABLED:
1477 		case BSTP_IFSTATE_BLOCKING:
1478 			m_freem(m);
1479 			goto done;
1480 		}
1481 	}
1482 
1483 	if (inet_pfil_hook.ph_hashooks > 0
1484 #ifdef INET6
1485 	    || inet6_pfil_hook.ph_hashooks > 0
1486 #endif
1487 	    ) {
1488 		if (bridge_pfil(&m, sc->sc_ifp, dst_if, PFIL_OUT) != 0)
1489 			goto done;
1490 		if (m == NULL)
1491 			goto done;
1492 	}
1493 	bridge_enqueue(sc, dst_if, m);
1494 
1495 	/*
1496 	 * ifp's serializer was held on entry and is expected to be held
1497 	 * on return.
1498 	 */
1499 done:
1500 	lwkt_serialize_enter(ifp->if_serializer);
1501 }
1502 
1503 /*
1504  * bridge_input:
1505  *
1506  *	Receive input from a member interface.  Queue the packet for
1507  *	bridging if it is not for us.
1508  */
1509 struct mbuf *
1510 bridge_input(struct ifnet *ifp, struct mbuf *m)
1511 {
1512 	struct bridge_softc *sc = ifp->if_bridge;
1513 	struct bridge_iflist *bif;
1514 	struct ifnet *bifp;
1515 	struct ether_header *eh;
1516 	struct mbuf *mc, *mc2;
1517 
1518 	bifp = sc->sc_ifp;
1519 	lwkt_serialize_enter(bifp->if_serializer);
1520 
1521 	if ((sc->sc_ifp->if_flags & IFF_RUNNING) == 0)
1522 		goto out;
1523 
1524 	bif = bridge_lookup_member_if(sc, ifp);
1525 	if (bif == NULL)
1526 		goto out;
1527 
1528 	eh = mtod(m, struct ether_header *);
1529 
1530 	m->m_flags &= ~M_PROTO1; /* XXX Hack - loop prevention */
1531 
1532 	/*
1533 	 * Tap all packets arriving on the bridge, no matter if
1534 	 * they are local destinations or not.  In is in.
1535 	 */
1536 	BPF_MTAP(bifp, m);
1537 
1538 #define IFP2AC(ifp) ((struct arpcom *)(ifp))
1539 #define IFP2ENADDR(ifp) (IFP2AC(ifp)->ac_enaddr)
1540 	if (memcmp(eh->ether_dhost, IFP2ENADDR(bifp),
1541 	    ETHER_ADDR_LEN) == 0) {
1542 		/*
1543 		 * If the packet is for us, set the packets source as the
1544 		 * bridge, and return the packet back to ether_input for
1545 		 * local processing.
1546 		 */
1547 
1548 		/* Mark the packet as arriving on the bridge interface */
1549 		m->m_pkthdr.rcvif = bifp;
1550 		bifp->if_ipackets++;
1551 
1552 		goto out;
1553 	}
1554 
1555 	if (ETHER_IS_MULTICAST(eh->ether_dhost)) {
1556 		/* Tap off 802.1D packets; they do not get forwarded. */
1557 		if (memcmp(eh->ether_dhost, bstp_etheraddr,
1558 		    ETHER_ADDR_LEN) == 0) {
1559 			m = bstp_input(ifp, m);
1560 			if (m == NULL)
1561 				goto out;
1562 		}
1563 
1564 		if (bif->bif_flags & IFBIF_STP) {
1565 			switch (bif->bif_state) {
1566 			case BSTP_IFSTATE_BLOCKING:
1567 			case BSTP_IFSTATE_LISTENING:
1568 			case BSTP_IFSTATE_DISABLED:
1569 				goto out;
1570 			}
1571 		}
1572 
1573 		if (bcmp(etherbroadcastaddr, eh->ether_dhost,
1574 		    sizeof(etherbroadcastaddr)) == 0)
1575 			m->m_flags |= M_BCAST;
1576 		else
1577 			m->m_flags |= M_MCAST;
1578 
1579 		/*
1580 		 * Make a deep copy of the packet and enqueue the copy
1581 		 * for bridge processing; return the original packet for
1582 		 * local processing.
1583 		 */
1584 		mc = m_dup(m, MB_DONTWAIT);
1585 		if (mc == NULL)
1586 			goto out;
1587 
1588 		bridge_forward(sc, mc);
1589 
1590 		/*
1591 		 * Reinject the mbuf as arriving on the bridge so we have a
1592 		 * chance at claiming multicast packets. We can not loop back
1593 		 * here from ether_input as a bridge is never a member of a
1594 		 * bridge.
1595 		 */
1596 		KASSERT(bifp->if_bridge == NULL,
1597 		    ("loop created in bridge_input"));
1598 		mc2 = m_copypacket(m, MB_DONTWAIT);
1599 		if (mc2 != NULL) {
1600 			mc2->m_pkthdr.rcvif = bifp;
1601 			(*bifp->if_input)(bifp, mc2);
1602 		}
1603 
1604 		/* Return the original packet for local processing. */
1605 		goto out;
1606 	}
1607 
1608 	if (bif->bif_flags & IFBIF_STP) {
1609 		switch (bif->bif_state) {
1610 		case BSTP_IFSTATE_BLOCKING:
1611 		case BSTP_IFSTATE_LISTENING:
1612 		case BSTP_IFSTATE_DISABLED:
1613 			goto out;
1614 		}
1615 	}
1616 
1617 	/*
1618 	 * Unicast.  Make sure it's not for us.
1619 	 */
1620 	LIST_FOREACH(bif, &sc->sc_iflist, bif_next) {
1621 		if (bif->bif_ifp->if_type != IFT_ETHER)
1622 			continue;
1623 		/* It is destined for us. */
1624 		if (memcmp(IF_LLADDR(bif->bif_ifp), eh->ether_dhost,
1625 		    ETHER_ADDR_LEN) == 0) {
1626 			if (bif->bif_flags & IFBIF_LEARNING)
1627 				bridge_rtupdate(sc,
1628 				    eh->ether_shost, ifp, 0, IFBAF_DYNAMIC);
1629 			m->m_pkthdr.rcvif = bif->bif_ifp;
1630 			if (ifp->if_type == IFT_GIF) {
1631 				m->m_flags |= M_PROTO1;
1632 				/*
1633 				 * Avoid an interface ordering deadlock.
1634 				 */
1635 				lwkt_serialize_exit(bifp->if_serializer);
1636 				lwkt_serialize_enter(bif->bif_ifp->if_serializer);
1637 				(*bif->bif_ifp->if_input)(bif->bif_ifp, m);
1638 				lwkt_serialize_exit(bif->bif_ifp->if_serializer);
1639 				lwkt_serialize_enter(bifp->if_serializer);
1640 				m = NULL;
1641 			}
1642 			goto out;
1643 		}
1644 
1645 		/* We just received a packet that we sent out. */
1646 		if (memcmp(IF_LLADDR(bif->bif_ifp), eh->ether_shost,
1647 		    ETHER_ADDR_LEN) == 0) {
1648 			m_freem(m);
1649 			m = NULL;
1650 			goto out;
1651 		}
1652 	}
1653 
1654 	/* Perform the bridge forwarding function. */
1655 	bridge_forward(sc, m);
1656 	m = NULL;
1657 
1658 out:
1659 	lwkt_serialize_exit(bifp->if_serializer);
1660 	return m;
1661 }
1662 
1663 /*
1664  * bridge_broadcast:
1665  *
1666  *	Send a frame to all interfaces that are members of
1667  *	the bridge, except for the one on which the packet
1668  *	arrived.
1669  */
1670 void
1671 bridge_broadcast(struct bridge_softc *sc, struct ifnet *src_if,
1672     struct mbuf *m, int runfilt)
1673 {
1674 	struct bridge_iflist *bif;
1675 	struct mbuf *mc;
1676 	struct ifnet *dst_if;
1677 	int used = 0;
1678 
1679 	/* Filter on the bridge interface before broadcasting */
1680 	if (runfilt && (inet_pfil_hook.ph_hashooks > 0
1681 #ifdef INET6
1682             || inet6_pfil_hook.ph_hashooks > 0
1683 #endif
1684 	    )) {
1685 		if (bridge_pfil(&m, sc->sc_ifp, NULL, PFIL_OUT) != 0)
1686 			return;
1687 		if (m == NULL)
1688 			return;
1689 	}
1690 
1691 	LIST_FOREACH(bif, &sc->sc_iflist, bif_next) {
1692 		dst_if = bif->bif_ifp;
1693 		if (dst_if == src_if)
1694 			continue;
1695 
1696 		if (bif->bif_flags & IFBIF_STP) {
1697 			switch (bif->bif_state) {
1698 			case BSTP_IFSTATE_BLOCKING:
1699 			case BSTP_IFSTATE_DISABLED:
1700 				continue;
1701 			}
1702 		}
1703 
1704 		if ((bif->bif_flags & IFBIF_DISCOVER) == 0 &&
1705 		    (m->m_flags & (M_BCAST|M_MCAST)) == 0)
1706 			continue;
1707 
1708 		if ((dst_if->if_flags & IFF_RUNNING) == 0)
1709 			continue;
1710 
1711 		if (LIST_NEXT(bif, bif_next) == NULL) {
1712 			mc = m;
1713 			used = 1;
1714 		} else {
1715 			mc = m_copypacket(m, MB_DONTWAIT);
1716 			if (mc == NULL) {
1717 				sc->sc_ifp->if_oerrors++;
1718 				continue;
1719 			}
1720 		}
1721 
1722 		/*
1723 		 * Filter on the output interface. Pass a NULL bridge interface
1724 		 * pointer so we do not redundantly filter on the bridge for
1725 		 * each interface we broadcast on.
1726 		 */
1727 		if (runfilt && (inet_pfil_hook.ph_hashooks > 0
1728 #ifdef INET6
1729 		    || inet6_pfil_hook.ph_hashooks > 0
1730 #endif
1731 		    )) {
1732 			if (bridge_pfil(&m, NULL, dst_if, PFIL_OUT) != 0)
1733 				return;
1734 			if (m == NULL)
1735 				return;
1736 		}
1737 
1738 		bridge_enqueue(sc, dst_if, mc);
1739 	}
1740 	if (used == 0)
1741 		m_freem(m);
1742 }
1743 
1744 /*
1745  * bridge_rtupdate:
1746  *
1747  *	Add a bridge routing entry.
1748  */
1749 int
1750 bridge_rtupdate(struct bridge_softc *sc, const uint8_t *dst,
1751     struct ifnet *dst_if, int setflags, uint8_t flags)
1752 {
1753 	struct bridge_rtnode *brt;
1754 	int error;
1755 
1756 	/*
1757 	 * A route for this destination might already exist.  If so,
1758 	 * update it, otherwise create a new one.
1759 	 */
1760 	if ((brt = bridge_rtnode_lookup(sc, dst)) == NULL) {
1761 		if (sc->sc_brtcnt >= sc->sc_brtmax)
1762 			return (ENOSPC);
1763 
1764 		/*
1765 		 * Allocate a new bridge forwarding node, and
1766 		 * initialize the expiration time and Ethernet
1767 		 * address.
1768 		 */
1769 		brt = malloc(sizeof(struct bridge_rtnode), M_DEVBUF, M_NOWAIT|M_ZERO);
1770 		if (brt == NULL)
1771 			return (ENOMEM);
1772 
1773 		brt->brt_expire = time_second + sc->sc_brttimeout;
1774 		brt->brt_flags = IFBAF_DYNAMIC;
1775 		memcpy(brt->brt_addr, dst, ETHER_ADDR_LEN);
1776 
1777 		if ((error = bridge_rtnode_insert(sc, brt)) != 0) {
1778 			free(brt, M_DEVBUF);
1779 			return (error);
1780 		}
1781 	}
1782 
1783 	brt->brt_ifp = dst_if;
1784 	if (setflags) {
1785 		brt->brt_flags = flags;
1786 		brt->brt_expire = (flags & IFBAF_STATIC) ? 0 :
1787 		    time_second + sc->sc_brttimeout;
1788 	}
1789 
1790 	return (0);
1791 }
1792 
1793 /*
1794  * bridge_rtlookup:
1795  *
1796  *	Lookup the destination interface for an address.
1797  */
1798 struct ifnet *
1799 bridge_rtlookup(struct bridge_softc *sc, const uint8_t *addr)
1800 {
1801 	struct bridge_rtnode *brt;
1802 
1803 	if ((brt = bridge_rtnode_lookup(sc, addr)) == NULL)
1804 		return (NULL);
1805 
1806 	return (brt->brt_ifp);
1807 }
1808 
1809 /*
1810  * bridge_rttrim:
1811  *
1812  *	Trim the routine table so that we have a number
1813  *	of routing entries less than or equal to the
1814  *	maximum number.
1815  */
1816 void
1817 bridge_rttrim(struct bridge_softc *sc)
1818 {
1819 	struct bridge_rtnode *brt, *nbrt;
1820 
1821 	/* Make sure we actually need to do this. */
1822 	if (sc->sc_brtcnt <= sc->sc_brtmax)
1823 		return;
1824 
1825 	/* Force an aging cycle; this might trim enough addresses. */
1826 	bridge_rtage(sc);
1827 	if (sc->sc_brtcnt <= sc->sc_brtmax)
1828 		return;
1829 
1830 	for (brt = LIST_FIRST(&sc->sc_rtlist); brt != NULL; brt = nbrt) {
1831 		nbrt = LIST_NEXT(brt, brt_list);
1832 		if ((brt->brt_flags & IFBAF_TYPEMASK) == IFBAF_DYNAMIC) {
1833 			bridge_rtnode_destroy(sc, brt);
1834 			if (sc->sc_brtcnt <= sc->sc_brtmax)
1835 				return;
1836 		}
1837 	}
1838 }
1839 
1840 /*
1841  * bridge_timer:
1842  *
1843  *	Aging timer for the bridge.
1844  */
1845 void
1846 bridge_timer(void *arg)
1847 {
1848 	struct bridge_softc *sc = arg;
1849 
1850 	lwkt_serialize_enter(sc->sc_ifp->if_serializer);
1851 
1852 	bridge_rtage(sc);
1853 
1854 	if (sc->sc_ifp->if_flags & IFF_RUNNING)
1855 		callout_reset(&sc->sc_brcallout,
1856 		    bridge_rtable_prune_period * hz, bridge_timer, sc);
1857 
1858 	lwkt_serialize_exit(sc->sc_ifp->if_serializer);
1859 }
1860 
1861 /*
1862  * bridge_rtage:
1863  *
1864  *	Perform an aging cycle.
1865  */
1866 void
1867 bridge_rtage(struct bridge_softc *sc)
1868 {
1869 	struct bridge_rtnode *brt, *nbrt;
1870 
1871 	for (brt = LIST_FIRST(&sc->sc_rtlist); brt != NULL; brt = nbrt) {
1872 		nbrt = LIST_NEXT(brt, brt_list);
1873 		if ((brt->brt_flags & IFBAF_TYPEMASK) == IFBAF_DYNAMIC) {
1874 			if (time_second >= brt->brt_expire)
1875 				bridge_rtnode_destroy(sc, brt);
1876 		}
1877 	}
1878 }
1879 
1880 /*
1881  * bridge_rtflush:
1882  *
1883  *	Remove all dynamic addresses from the bridge.
1884  */
1885 void
1886 bridge_rtflush(struct bridge_softc *sc, int full)
1887 {
1888 	struct bridge_rtnode *brt, *nbrt;
1889 
1890 	for (brt = LIST_FIRST(&sc->sc_rtlist); brt != NULL; brt = nbrt) {
1891 		nbrt = LIST_NEXT(brt, brt_list);
1892 		if (full || (brt->brt_flags & IFBAF_TYPEMASK) == IFBAF_DYNAMIC)
1893 			bridge_rtnode_destroy(sc, brt);
1894 	}
1895 }
1896 
1897 /*
1898  * bridge_rtdaddr:
1899  *
1900  *	Remove an address from the table.
1901  */
1902 int
1903 bridge_rtdaddr(struct bridge_softc *sc, const uint8_t *addr)
1904 {
1905 	struct bridge_rtnode *brt;
1906 
1907 	if ((brt = bridge_rtnode_lookup(sc, addr)) == NULL)
1908 		return (ENOENT);
1909 
1910 	bridge_rtnode_destroy(sc, brt);
1911 	return (0);
1912 }
1913 
1914 /*
1915  * bridge_rtdelete:
1916  *
1917  *	Delete routes to a speicifc member interface.
1918  */
1919 void
1920 bridge_rtdelete(struct bridge_softc *sc, struct ifnet *ifp, int full)
1921 {
1922 	struct bridge_rtnode *brt, *nbrt;
1923 
1924 	for (brt = LIST_FIRST(&sc->sc_rtlist); brt != NULL; brt = nbrt) {
1925 		nbrt = LIST_NEXT(brt, brt_list);
1926 		if (brt->brt_ifp == ifp && (full ||
1927 			    (brt->brt_flags & IFBAF_TYPEMASK) == IFBAF_DYNAMIC))
1928 			bridge_rtnode_destroy(sc, brt);
1929 	}
1930 }
1931 
1932 /*
1933  * bridge_rtable_init:
1934  *
1935  *	Initialize the route table for this bridge.
1936  */
1937 int
1938 bridge_rtable_init(struct bridge_softc *sc)
1939 {
1940 	int i;
1941 
1942 	sc->sc_rthash = malloc(sizeof(*sc->sc_rthash) * BRIDGE_RTHASH_SIZE,
1943 	    M_DEVBUF, M_NOWAIT);
1944 	if (sc->sc_rthash == NULL)
1945 		return (ENOMEM);
1946 
1947 	for (i = 0; i < BRIDGE_RTHASH_SIZE; i++)
1948 		LIST_INIT(&sc->sc_rthash[i]);
1949 
1950 	sc->sc_rthash_key = arc4random();
1951 
1952 	LIST_INIT(&sc->sc_rtlist);
1953 
1954 	return (0);
1955 }
1956 
1957 /*
1958  * bridge_rtable_fini:
1959  *
1960  *	Deconstruct the route table for this bridge.
1961  */
1962 void
1963 bridge_rtable_fini(struct bridge_softc *sc)
1964 {
1965 
1966 	free(sc->sc_rthash, M_DEVBUF);
1967 }
1968 
1969 /*
1970  * The following hash function is adapted from "Hash Functions" by Bob Jenkins
1971  * ("Algorithm Alley", Dr. Dobbs Journal, September 1997).
1972  */
1973 #define	mix(a, b, c)							\
1974 do {									\
1975 	a -= b; a -= c; a ^= (c >> 13);					\
1976 	b -= c; b -= a; b ^= (a << 8);					\
1977 	c -= a; c -= b; c ^= (b >> 13);					\
1978 	a -= b; a -= c; a ^= (c >> 12);					\
1979 	b -= c; b -= a; b ^= (a << 16);					\
1980 	c -= a; c -= b; c ^= (b >> 5);					\
1981 	a -= b; a -= c; a ^= (c >> 3);					\
1982 	b -= c; b -= a; b ^= (a << 10);					\
1983 	c -= a; c -= b; c ^= (b >> 15);					\
1984 } while (/*CONSTCOND*/0)
1985 
1986 static __inline uint32_t
1987 bridge_rthash(struct bridge_softc *sc, const uint8_t *addr)
1988 {
1989 	uint32_t a = 0x9e3779b9, b = 0x9e3779b9, c = sc->sc_rthash_key;
1990 
1991 	b += addr[5] << 8;
1992 	b += addr[4];
1993 	a += addr[3] << 24;
1994 	a += addr[2] << 16;
1995 	a += addr[1] << 8;
1996 	a += addr[0];
1997 
1998 	mix(a, b, c);
1999 
2000 	return (c & BRIDGE_RTHASH_MASK);
2001 }
2002 
2003 #undef mix
2004 
2005 /*
2006  * bridge_rtnode_lookup:
2007  *
2008  *	Look up a bridge route node for the specified destination.
2009  */
2010 struct bridge_rtnode *
2011 bridge_rtnode_lookup(struct bridge_softc *sc, const uint8_t *addr)
2012 {
2013 	struct bridge_rtnode *brt;
2014 	uint32_t hash;
2015 	int dir;
2016 
2017 	hash = bridge_rthash(sc, addr);
2018 	LIST_FOREACH(brt, &sc->sc_rthash[hash], brt_hash) {
2019 		dir = memcmp(addr, brt->brt_addr, ETHER_ADDR_LEN);
2020 		if (dir == 0)
2021 			return (brt);
2022 		if (dir > 0)
2023 			return (NULL);
2024 	}
2025 
2026 	return (NULL);
2027 }
2028 
2029 /*
2030  * bridge_rtnode_insert:
2031  *
2032  *	Insert the specified bridge node into the route table.  We
2033  *	assume the entry is not already in the table.
2034  */
2035 int
2036 bridge_rtnode_insert(struct bridge_softc *sc, struct bridge_rtnode *brt)
2037 {
2038 	struct bridge_rtnode *lbrt;
2039 	uint32_t hash;
2040 	int dir;
2041 
2042 	hash = bridge_rthash(sc, brt->brt_addr);
2043 
2044 	lbrt = LIST_FIRST(&sc->sc_rthash[hash]);
2045 	if (lbrt == NULL) {
2046 		LIST_INSERT_HEAD(&sc->sc_rthash[hash], brt, brt_hash);
2047 		goto out;
2048 	}
2049 
2050 	do {
2051 		dir = memcmp(brt->brt_addr, lbrt->brt_addr, ETHER_ADDR_LEN);
2052 		if (dir == 0)
2053 			return (EEXIST);
2054 		if (dir > 0) {
2055 			LIST_INSERT_BEFORE(lbrt, brt, brt_hash);
2056 			goto out;
2057 		}
2058 		if (LIST_NEXT(lbrt, brt_hash) == NULL) {
2059 			LIST_INSERT_AFTER(lbrt, brt, brt_hash);
2060 			goto out;
2061 		}
2062 		lbrt = LIST_NEXT(lbrt, brt_hash);
2063 	} while (lbrt != NULL);
2064 
2065 #ifdef DIAGNOSTIC
2066 	panic("bridge_rtnode_insert: impossible");
2067 #endif
2068 
2069  out:
2070 	LIST_INSERT_HEAD(&sc->sc_rtlist, brt, brt_list);
2071 	sc->sc_brtcnt++;
2072 
2073 	return (0);
2074 }
2075 
2076 /*
2077  * bridge_rtnode_destroy:
2078  *
2079  *	Destroy a bridge rtnode.
2080  */
2081 void
2082 bridge_rtnode_destroy(struct bridge_softc *sc, struct bridge_rtnode *brt)
2083 {
2084 
2085 	LIST_REMOVE(brt, brt_hash);
2086 
2087 	LIST_REMOVE(brt, brt_list);
2088 	sc->sc_brtcnt--;
2089 	free(brt, M_DEVBUF);
2090 }
2091 
2092 /*
2093  * Send bridge packets through pfil if they are one of the types pfil can deal
2094  * with, or if they are ARP or REVARP.  (pfil will pass ARP and REVARP without
2095  * question.) If *bifp or *ifp are NULL then packet filtering is skipped for
2096  * that interface.
2097  */
2098 static int
2099 bridge_pfil(struct mbuf **mp, struct ifnet *bifp, struct ifnet *ifp, int dir)
2100 {
2101 	int snap, error, i;
2102 	struct ether_header *eh1, eh2;
2103 	struct ip *ip;
2104 	struct llc llc1;
2105 	u_int16_t ether_type;
2106 
2107 	snap = 0;
2108 	error = -1;	/* Default error if not error == 0 */
2109 
2110 	i = min((*mp)->m_pkthdr.len, max_protohdr);
2111 	if ((*mp)->m_len < i) {
2112 	    *mp = m_pullup(*mp, i);
2113 	    if (*mp == NULL) {
2114 		printf("%s: m_pullup failed\n", __func__);
2115 		return -1;
2116 	    }
2117 	}
2118 
2119 	eh1 = mtod(*mp, struct ether_header *);
2120 	ether_type = ntohs(eh1->ether_type);
2121 
2122 	/*
2123 	 * Check for SNAP/LLC.
2124 	 */
2125 	if (ether_type < ETHERMTU) {
2126 		struct llc *llc2 = (struct llc *)(eh1 + 1);
2127 
2128 		if ((*mp)->m_len >= ETHER_HDR_LEN + 8 &&
2129 		    llc2->llc_dsap == LLC_SNAP_LSAP &&
2130 		    llc2->llc_ssap == LLC_SNAP_LSAP &&
2131 		    llc2->llc_control == LLC_UI) {
2132 			ether_type = htons(llc2->llc_un.type_snap.ether_type);
2133 			snap = 1;
2134 		}
2135 	}
2136 
2137 	/*
2138 	 * If we're trying to filter bridge traffic, don't look at anything
2139 	 * other than IP and ARP traffic.  If the filter doesn't understand
2140 	 * IPv6, don't allow IPv6 through the bridge either.  This is lame
2141 	 * since if we really wanted, say, an AppleTalk filter, we are hosed,
2142 	 * but of course we don't have an AppleTalk filter to begin with.
2143 	 * (Note that since pfil doesn't understand ARP it will pass *ALL*
2144 	 * ARP traffic.)
2145 	 */
2146 	switch (ether_type) {
2147 		case ETHERTYPE_ARP:
2148 		case ETHERTYPE_REVARP:
2149 			return 0; /* Automatically pass */
2150 		case ETHERTYPE_IP:
2151 # ifdef INET6
2152 		case ETHERTYPE_IPV6:
2153 # endif /* INET6 */
2154 			break;
2155 		default:
2156 			goto bad;
2157 	}
2158 
2159 	/* Strip off the Ethernet header and keep a copy. */
2160 	m_copydata(*mp, 0, ETHER_HDR_LEN, (caddr_t) &eh2);
2161 	m_adj(*mp, ETHER_HDR_LEN);
2162 
2163 	/* Strip off snap header, if present */
2164 	if (snap) {
2165 		m_copydata(*mp, 0, sizeof(struct llc), (caddr_t) &llc1);
2166 		m_adj(*mp, sizeof(struct llc));
2167 	}
2168 
2169 	/*
2170 	 * Check the IP header for alignment and errors
2171 	 */
2172 	if (dir == PFIL_IN) {
2173 		switch (ether_type) {
2174 			case ETHERTYPE_IP:
2175 				error = bridge_ip_checkbasic(mp);
2176 				break;
2177 # ifdef INET6
2178 			case ETHERTYPE_IPV6:
2179 				error = bridge_ip6_checkbasic(mp);
2180 				break;
2181 # endif /* INET6 */
2182 			default:
2183 				error = 0;
2184 		}
2185 		if (error)
2186 			goto bad;
2187 	}
2188 
2189 	error = 0;
2190 
2191 	/*
2192 	 * Run the packet through pfil
2193 	 */
2194 	switch (ether_type)
2195 	{
2196 	case ETHERTYPE_IP :
2197 		/*
2198 		 * before calling the firewall, swap fields the same as
2199 		 * IP does. here we assume the header is contiguous
2200 		 */
2201 		ip = mtod(*mp, struct ip *);
2202 
2203 		ip->ip_len = ntohs(ip->ip_len);
2204 		ip->ip_off = ntohs(ip->ip_off);
2205 
2206 		/*
2207 		 * Run pfil on the member interface and the bridge, both can
2208 		 * be skipped by clearing pfil_member or pfil_bridge.
2209 		 *
2210 		 * Keep the order:
2211 		 *   in_if -> bridge_if -> out_if
2212 		 */
2213 		if (pfil_bridge && dir == PFIL_OUT && bifp != NULL)
2214 			error = pfil_run_hooks(&inet_pfil_hook, mp, bifp,
2215 					dir);
2216 
2217 		if (*mp == NULL || error != 0) /* filter may consume */
2218 			break;
2219 
2220 		if (pfil_member && ifp != NULL)
2221 			error = pfil_run_hooks(&inet_pfil_hook, mp, ifp,
2222 					dir);
2223 
2224 		if (*mp == NULL || error != 0) /* filter may consume */
2225 			break;
2226 
2227 		if (pfil_bridge && dir == PFIL_IN && bifp != NULL)
2228 			error = pfil_run_hooks(&inet_pfil_hook, mp, bifp,
2229 					dir);
2230 
2231 		/* Restore ip and the fields ntohs()'d. */
2232 		if (*mp != NULL && error == 0) {
2233 			ip = mtod(*mp, struct ip *);
2234 			ip->ip_len = htons(ip->ip_len);
2235 			ip->ip_off = htons(ip->ip_off);
2236 		}
2237 
2238 		break;
2239 # ifdef INET6
2240 	case ETHERTYPE_IPV6 :
2241 		if (pfil_bridge && dir == PFIL_OUT && bifp != NULL)
2242 			error = pfil_run_hooks(&inet6_pfil_hook, mp, bifp,
2243 					dir);
2244 
2245 		if (*mp == NULL || error != 0) /* filter may consume */
2246 			break;
2247 
2248 		if (pfil_member && ifp != NULL)
2249 			error = pfil_run_hooks(&inet6_pfil_hook, mp, ifp,
2250 					dir);
2251 
2252 		if (*mp == NULL || error != 0) /* filter may consume */
2253 			break;
2254 
2255 		if (pfil_bridge && dir == PFIL_IN && bifp != NULL)
2256 			error = pfil_run_hooks(&inet6_pfil_hook, mp, bifp,
2257 					dir);
2258 		break;
2259 # endif
2260 	default :
2261 		error = 0;
2262 		break;
2263 	}
2264 
2265 	if (*mp == NULL)
2266 		return error;
2267 	if (error != 0)
2268 		goto bad;
2269 
2270 	error = -1;
2271 
2272 	/*
2273 	 * Finally, put everything back the way it was and return
2274 	 */
2275 	if (snap) {
2276 		M_PREPEND(*mp, sizeof(struct llc), MB_DONTWAIT);
2277 		if (*mp == NULL)
2278 			return error;
2279 		bcopy(&llc1, mtod(*mp, caddr_t), sizeof(struct llc));
2280 	}
2281 
2282 	M_PREPEND(*mp, ETHER_HDR_LEN, MB_DONTWAIT);
2283 	if (*mp == NULL)
2284 		return error;
2285 	bcopy(&eh2, mtod(*mp, caddr_t), ETHER_HDR_LEN);
2286 
2287 	return 0;
2288 
2289     bad:
2290 	m_freem(*mp);
2291 	*mp = NULL;
2292 	return error;
2293 }
2294 
2295 /*
2296  * Perform basic checks on header size since
2297  * pfil assumes ip_input has already processed
2298  * it for it.  Cut-and-pasted from ip_input.c.
2299  * Given how simple the IPv6 version is,
2300  * does the IPv4 version really need to be
2301  * this complicated?
2302  *
2303  * XXX Should we update ipstat here, or not?
2304  * XXX Right now we update ipstat but not
2305  * XXX csum_counter.
2306  */
2307 static int
2308 bridge_ip_checkbasic(struct mbuf **mp)
2309 {
2310 	struct mbuf *m = *mp;
2311 	struct ip *ip;
2312 	int len, hlen;
2313 	u_short sum;
2314 
2315 	if (*mp == NULL)
2316 		return -1;
2317 #if notyet
2318 	if (IP_HDR_ALIGNED_P(mtod(m, caddr_t)) == 0) {
2319 		if ((m = m_copyup(m, sizeof(struct ip),
2320 			(max_linkhdr + 3) & ~3)) == NULL) {
2321 			/* XXXJRT new stat, please */
2322 			ipstat.ips_toosmall++;
2323 			goto bad;
2324 		}
2325 	} else
2326 #endif
2327 #ifndef __predict_false
2328 #define __predict_false(x) x
2329 #endif
2330 	 if (__predict_false(m->m_len < sizeof (struct ip))) {
2331 		if ((m = m_pullup(m, sizeof (struct ip))) == NULL) {
2332 			ipstat.ips_toosmall++;
2333 			goto bad;
2334 		}
2335 	}
2336 	ip = mtod(m, struct ip *);
2337 	if (ip == NULL) goto bad;
2338 
2339 	if (ip->ip_v != IPVERSION) {
2340 		ipstat.ips_badvers++;
2341 		goto bad;
2342 	}
2343 	hlen = ip->ip_hl << 2;
2344 	if (hlen < sizeof(struct ip)) { /* minimum header length */
2345 		ipstat.ips_badhlen++;
2346 		goto bad;
2347 	}
2348 	if (hlen > m->m_len) {
2349 		if ((m = m_pullup(m, hlen)) == 0) {
2350 			ipstat.ips_badhlen++;
2351 			goto bad;
2352 		}
2353 		ip = mtod(m, struct ip *);
2354 		if (ip == NULL) goto bad;
2355 	}
2356 
2357 	if (m->m_pkthdr.csum_flags & CSUM_IP_CHECKED) {
2358 		sum = !(m->m_pkthdr.csum_flags & CSUM_IP_VALID);
2359 	} else {
2360 		if (hlen == sizeof(struct ip)) {
2361 			sum = in_cksum_hdr(ip);
2362 		} else {
2363 			sum = in_cksum(m, hlen);
2364 		}
2365 	}
2366 	if (sum) {
2367 		ipstat.ips_badsum++;
2368 		goto bad;
2369 	}
2370 
2371 	/* Retrieve the packet length. */
2372 	len = ntohs(ip->ip_len);
2373 
2374 	/*
2375 	 * Check for additional length bogosity
2376 	 */
2377 	if (len < hlen) {
2378 		ipstat.ips_badlen++;
2379 		goto bad;
2380 	}
2381 
2382 	/*
2383 	 * Check that the amount of data in the buffers
2384 	 * is as at least much as the IP header would have us expect.
2385 	 * Drop packet if shorter than we expect.
2386 	 */
2387 	if (m->m_pkthdr.len < len) {
2388 		ipstat.ips_tooshort++;
2389 		goto bad;
2390 	}
2391 
2392 	/* Checks out, proceed */
2393 	*mp = m;
2394 	return 0;
2395 
2396     bad:
2397 	*mp = m;
2398 	return -1;
2399 }
2400 
2401 # ifdef INET6
2402 /*
2403  * Same as above, but for IPv6.
2404  * Cut-and-pasted from ip6_input.c.
2405  * XXX Should we update ip6stat, or not?
2406  */
2407 static int
2408 bridge_ip6_checkbasic(struct mbuf **mp)
2409 {
2410 	struct mbuf *m = *mp;
2411 	struct ip6_hdr *ip6;
2412 
2413 	/*
2414 	 * If the IPv6 header is not aligned, slurp it up into a new
2415 	 * mbuf with space for link headers, in the event we forward
2416 	 * it.  Otherwise, if it is aligned, make sure the entire base
2417 	 * IPv6 header is in the first mbuf of the chain.
2418 	 */
2419 #if notyet
2420 	if (IP6_HDR_ALIGNED_P(mtod(m, caddr_t)) == 0) {
2421 		struct ifnet *inifp = m->m_pkthdr.rcvif;
2422 		if ((m = m_copyup(m, sizeof(struct ip6_hdr),
2423 			    (max_linkhdr + 3) & ~3)) == NULL) {
2424 			/* XXXJRT new stat, please */
2425 			ip6stat.ip6s_toosmall++;
2426 			in6_ifstat_inc(inifp, ifs6_in_hdrerr);
2427 			goto bad;
2428 		}
2429 	} else
2430 #endif
2431         if (__predict_false(m->m_len < sizeof(struct ip6_hdr))) {
2432 		struct ifnet *inifp = m->m_pkthdr.rcvif;
2433 		if ((m = m_pullup(m, sizeof(struct ip6_hdr))) == NULL) {
2434 			ip6stat.ip6s_toosmall++;
2435 			in6_ifstat_inc(inifp, ifs6_in_hdrerr);
2436 			goto bad;
2437 		}
2438 	}
2439 
2440 	ip6 = mtod(m, struct ip6_hdr *);
2441 
2442 	if ((ip6->ip6_vfc & IPV6_VERSION_MASK) != IPV6_VERSION) {
2443 		ip6stat.ip6s_badvers++;
2444 		in6_ifstat_inc(m->m_pkthdr.rcvif, ifs6_in_hdrerr);
2445 		goto bad;
2446 	}
2447 
2448 	/* Checks out, proceed */
2449 	*mp = m;
2450 	return 0;
2451 
2452     bad:
2453 	*mp = m;
2454 	return -1;
2455 }
2456 # endif /* INET6 */
2457