xref: /dragonfly/sys/netgraph/fec/ng_fec.c (revision cc93b0eb)
1 /*
2  * ng_fec.c
3  *
4  * Copyright (c) 2001 Berkeley Software Design, Inc.
5  * Copyright (c) 2000, 2001
6  *	Bill Paul <wpaul@osd.bsdi.com>.  All rights reserved.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  * 3. All advertising materials mentioning features or use of this software
17  *    must display the following acknowledgement:
18  *	This product includes software developed by Bill Paul.
19  * 4. Neither the name of the author nor the names of any co-contributors
20  *    may be used to endorse or promote products derived from this software
21  *    without specific prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY Bill Paul AND CONTRIBUTORS ``AS IS'' AND
24  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26  * ARE DISCLAIMED.  IN NO EVENT SHALL Bill Paul OR THE VOICES IN HIS HEAD
27  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
28  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
29  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
30  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
31  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
32  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
33  * THE POSSIBILITY OF SUCH DAMAGE.
34  *
35  * $FreeBSD: src/sys/netgraph/ng_fec.c,v 1.1.2.1 2002/11/01 21:39:31 julian Exp $
36  * $DragonFly: src/sys/netgraph/fec/ng_fec.c,v 1.26 2008/05/28 12:11:13 sephe Exp $
37  */
38 /*
39  * Copyright (c) 1996-1999 Whistle Communications, Inc.
40  * All rights reserved.
41  *
42  * Subject to the following obligations and disclaimer of warranty, use and
43  * redistribution of this software, in source or object code forms, with or
44  * without modifications are expressly permitted by Whistle Communications;
45  * provided, however, that:
46  * 1. Any and all reproductions of the source or object code must include the
47  *    copyright notice above and the following disclaimer of warranties; and
48  * 2. No rights are granted, in any manner or form, to use Whistle
49  *    Communications, Inc. trademarks, including the mark "WHISTLE
50  *    COMMUNICATIONS" on advertising, endorsements, or otherwise except as
51  *    such appears in the above copyright notice or in the software.
52  *
53  * THIS SOFTWARE IS BEING PROVIDED BY WHISTLE COMMUNICATIONS "AS IS", AND
54  * TO THE MAXIMUM EXTENT PERMITTED BY LAW, WHISTLE COMMUNICATIONS MAKES NO
55  * REPRESENTATIONS OR WARRANTIES, EXPRESS OR IMPLIED, REGARDING THIS SOFTWARE,
56  * INCLUDING WITHOUT LIMITATION, ANY AND ALL IMPLIED WARRANTIES OF
57  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE, OR NON-INFRINGEMENT.
58  * WHISTLE COMMUNICATIONS DOES NOT WARRANT, GUARANTEE, OR MAKE ANY
59  * REPRESENTATIONS REGARDING THE USE OF, OR THE RESULTS OF THE USE OF THIS
60  * SOFTWARE IN TERMS OF ITS CORRECTNESS, ACCURACY, RELIABILITY OR OTHERWISE.
61  * IN NO EVENT SHALL WHISTLE COMMUNICATIONS BE LIABLE FOR ANY DAMAGES
62  * RESULTING FROM OR ARISING OUT OF ANY USE OF THIS SOFTWARE, INCLUDING
63  * WITHOUT LIMITATION, ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY,
64  * PUNITIVE, OR CONSEQUENTIAL DAMAGES, PROCUREMENT OF SUBSTITUTE GOODS OR
65  * SERVICES, LOSS OF USE, DATA OR PROFITS, HOWEVER CAUSED AND UNDER ANY
66  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
67  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
68  * THIS SOFTWARE, EVEN IF WHISTLE COMMUNICATIONS IS ADVISED OF THE POSSIBILITY
69  * OF SUCH DAMAGE.
70  *
71  * Author: Archie Cobbs <archie@freebsd.org>
72  *
73  * $Whistle: ng_fec.c,v 1.33 1999/11/01 09:24:51 julian Exp $
74  */
75 
76 /*
77  * This module implements ethernet channel bonding using the Cisco
78  * Fast EtherChannel mechanism. Two or four ports may be combined
79  * into a single aggregate interface.
80  *
81  * Interfaces are named fec0, fec1, etc.  New nodes take the
82  * first available interface name.
83  *
84  * This node also includes Berkeley packet filter support.
85  *
86  * Note that this node doesn't need to connect to any other
87  * netgraph nodes in order to do its work.
88  */
89 
90 #include <sys/param.h>
91 #include <sys/systm.h>
92 #include <sys/errno.h>
93 #include <sys/kernel.h>
94 #include <sys/malloc.h>
95 #include <sys/mbuf.h>
96 #include <sys/errno.h>
97 #include <sys/sockio.h>
98 #include <sys/socket.h>
99 #include <sys/syslog.h>
100 #include <sys/libkern.h>
101 #include <sys/queue.h>
102 #include <sys/thread2.h>
103 
104 #include <net/if.h>
105 #include <net/if_types.h>
106 #include <net/if_arp.h>
107 #include <net/if_dl.h>
108 #include <net/if_media.h>
109 #include <net/bpf.h>
110 #include <net/ethernet.h>
111 
112 #include "opt_inet.h"
113 #include "opt_inet6.h"
114 
115 #include <netinet/in.h>
116 #ifdef INET
117 #include <netinet/in_systm.h>
118 #include <netinet/ip.h>
119 #endif
120 
121 #ifdef INET6
122 #include <netinet/ip6.h>
123 #endif
124 
125 #include <netgraph/ng_message.h>
126 #include <netgraph/netgraph.h>
127 #include <netgraph/ng_parse.h>
128 #include "ng_fec.h"
129 
/*
 * Fetch the netgraph node recorded in an interface: the ifnet pointer is
 * reinterpreted as a struct arpcom and its ac_netgraph member is returned
 * as a struct ng_node pointer.
 */
#define IFP2NG(ifp)  ((struct ng_node *)((struct arpcom *)(ifp))->ac_netgraph)

/*
 * Advance x by one, wrapping to zero at y.  Both arguments and the whole
 * expansion are parenthesized so that expression arguments (e.g. "n + 1")
 * and use inside larger expressions behave as expected.  Note that x is
 * evaluated twice, so it must not have side effects.
 */
#define FEC_INC(x, y)	((x) = ((x) + 1) % (y))

/*
 * Current fast etherchannel implementations use either 2 or 4
 * ports, so for now we limit the maximum bundle size to 4 interfaces.
 */
#define FEC_BUNDLESIZ	4
138 
139 struct ng_fec_portlist {
140 	struct ifnet		*fec_if;
141 	int			fec_idx;
142 	int			fec_ifstat;
143 	struct ether_addr	fec_mac;
144 	TAILQ_ENTRY(ng_fec_portlist) fec_list;
145 };
146 
147 struct ng_fec_bundle {
148 	TAILQ_HEAD(,ng_fec_portlist) ng_fec_ports;
149 	int			fec_ifcnt;
150 	int			fec_btype;
151 };
152 
153 #define FEC_BTYPE_MAC		0x01
154 #define FEC_BTYPE_INET		0x02
155 #define FEC_BTYPE_INET6		0x03
156 
157 /* Node private data */
158 struct ng_fec_private {
159 	struct arpcom arpcom;
160 	struct ifmedia ifmedia;
161 	int	if_flags;
162 	int	if_error;		/* XXX */
163 	int	unit;			/* Interface unit number */
164 	node_p	node;			/* Our netgraph node */
165 	struct ng_fec_bundle fec_bundle;/* Aggregate bundle */
166 	struct callout fec_timeout;	/* callout for ticker */
167 	int	(*real_if_output)(struct ifnet *, struct mbuf *,
168 				  struct sockaddr *, struct rtentry *);
169 };
170 typedef struct ng_fec_private *priv_p;
171 
172 /* Interface methods */
173 static void	ng_fec_input(struct ifnet *, struct mbuf **);
174 static void	ng_fec_start(struct ifnet *ifp);
175 static int	ng_fec_choose_port(struct ng_fec_bundle *b,
176 			struct mbuf *m, struct ifnet **ifp);
177 static int	ng_fec_setport(struct ifnet *ifp, u_long cmd, caddr_t data);
178 static void	ng_fec_init(void *arg);
179 static void	ng_fec_stop(struct ifnet *ifp);
180 static int	ng_fec_ifmedia_upd(struct ifnet *ifp);
181 static void	ng_fec_ifmedia_sts(struct ifnet *ifp, struct ifmediareq *ifmr);
182 static int	ng_fec_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data,
183 			     struct ucred *);
184 static int	ng_fec_output(struct ifnet *ifp, struct mbuf *m0,
185 			struct sockaddr *dst, struct rtentry *rt0);
186 static void	ng_fec_tick(void *arg);
187 static int	ng_fec_addport(struct ng_fec_private *priv, char *iface);
188 static int	ng_fec_delport(struct ng_fec_private *priv, char *iface);
189 
190 #ifdef DEBUG
191 static void	ng_fec_print_ioctl(struct ifnet *ifp, int cmd, caddr_t data);
192 #endif
193 
194 /* Netgraph methods */
195 static ng_constructor_t	ng_fec_constructor;
196 static ng_rcvmsg_t	ng_fec_rcvmsg;
197 static ng_shutdown_t	ng_fec_rmnode;
198 
199 /* List of commands and how to convert arguments to/from ASCII */
200 static const struct ng_cmdlist ng_fec_cmds[] = {
201 	{
202 	  NGM_FEC_COOKIE,
203 	  NGM_FEC_ADD_IFACE,
204 	  "add_iface",
205 	  &ng_parse_string_type,
206 	  NULL,
207 	},
208 	{
209 	  NGM_FEC_COOKIE,
210 	  NGM_FEC_DEL_IFACE,
211 	  "del_iface",
212 	  &ng_parse_string_type,
213 	  NULL,
214 	},
215 	{
216 	  NGM_FEC_COOKIE,
217 	  NGM_FEC_SET_MODE_MAC,
218 	  "set_mode_mac",
219 	  NULL,
220 	  NULL,
221 	},
222 	{
223 	  NGM_FEC_COOKIE,
224 	  NGM_FEC_SET_MODE_INET,
225 	  "set_mode_inet",
226 	  NULL,
227 	  NULL,
228 	},
229 	{ 0 }
230 };
231 
232 /* Node type descriptor */
233 static struct ng_type typestruct = {
234 	NG_VERSION,
235 	NG_FEC_NODE_TYPE,
236 	NULL,
237 	ng_fec_constructor,
238 	ng_fec_rcvmsg,
239 	ng_fec_rmnode,
240 	NULL,
241 	NULL,
242 	NULL,
243 	NULL,
244 	NULL,
245 	NULL,
246 	ng_fec_cmds
247 };
248 NETGRAPH_INIT(fec, &typestruct);
249 
250 /* We keep a bitmap indicating which unit numbers are free.
251    One means the unit number is free, zero means it's taken. */
252 static int	*ng_fec_units = NULL;
253 static int	ng_fec_units_len = 0;
254 static int	ng_units_in_use = 0;
255 
256 #define UNITS_BITSPERWORD	(sizeof(*ng_fec_units) * NBBY)
257 
258 /*
259  * Find the first free unit number for a new interface.
260  * Increase the size of the unit bitmap as necessary.
261  */
262 static __inline__ int
263 ng_fec_get_unit(int *unit)
264 {
265 	int index, bit;
266 
267 	for (index = 0; index < ng_fec_units_len
268 	    && ng_fec_units[index] == 0; index++);
269 	if (index == ng_fec_units_len) {		/* extend array */
270 		int i, *newarray, newlen;
271 
272 		newlen = (2 * ng_fec_units_len) + 4;
273 		MALLOC(newarray, int *, newlen * sizeof(*ng_fec_units),
274 		    M_NETGRAPH, M_NOWAIT);
275 		if (newarray == NULL)
276 			return (ENOMEM);
277 		bcopy(ng_fec_units, newarray,
278 		    ng_fec_units_len * sizeof(*ng_fec_units));
279 		for (i = ng_fec_units_len; i < newlen; i++)
280 			newarray[i] = ~0;
281 		if (ng_fec_units != NULL)
282 			FREE(ng_fec_units, M_NETGRAPH);
283 		ng_fec_units = newarray;
284 		ng_fec_units_len = newlen;
285 	}
286 	bit = ffs(ng_fec_units[index]) - 1;
287 	KASSERT(bit >= 0 && bit <= UNITS_BITSPERWORD - 1,
288 	    ("%s: word=%d bit=%d", __func__, ng_fec_units[index], bit));
289 	ng_fec_units[index] &= ~(1 << bit);
290 	*unit = (index * UNITS_BITSPERWORD) + bit;
291 	ng_units_in_use++;
292 	return (0);
293 }
294 
295 /*
296  * Free a no longer needed unit number.
297  */
298 static __inline__ void
299 ng_fec_free_unit(int unit)
300 {
301 	int index, bit;
302 
303 	index = unit / UNITS_BITSPERWORD;
304 	bit = unit % UNITS_BITSPERWORD;
305 	KASSERT(index < ng_fec_units_len,
306 	    ("%s: unit=%d len=%d", __func__, unit, ng_fec_units_len));
307 	KASSERT((ng_fec_units[index] & (1 << bit)) == 0,
308 	    ("%s: unit=%d is free", __func__, unit));
309 	ng_fec_units[index] |= (1 << bit);
310 	/*
311 	 * XXX We could think about reducing the size of ng_fec_units[]
312 	 * XXX here if the last portion is all ones
313 	 * XXX At least free it if no more units.
314 	 * Needed if we are eventually be able to unload.
315 	 */
316 	ng_units_in_use++;
317 	if (ng_units_in_use == 0) { /* XXX make SMP safe */
318 		FREE(ng_fec_units, M_NETGRAPH);
319 		ng_fec_units_len = 0;
320 		ng_fec_units = NULL;
321 	}
322 }
323 
324 /************************************************************************
325 			INTERFACE STUFF
326  ************************************************************************/
327 
328 static int
329 ng_fec_addport(struct ng_fec_private *priv, char *iface)
330 {
331 	struct ng_fec_bundle	*b;
332 	struct ifnet		*ifp, *bifp;
333 	struct arpcom		*ac;
334 	struct sockaddr_dl	*sdl;
335 	struct ng_fec_portlist	*p, *new;
336 
337 	if (priv == NULL || iface == NULL)
338 		return(EINVAL);
339 
340 	b = &priv->fec_bundle;
341 	ifp = &priv->arpcom.ac_if;
342 
343 	/* Find the interface */
344 	bifp = ifunit(iface);
345 	if (bifp == NULL) {
346 		kprintf("fec%d: tried to add iface %s, which "
347 		    "doesn't seem to exist\n", priv->unit, iface);
348 		return(ENOENT);
349 	}
350 
351 	/* See if we have room in the bundle */
352 	if (b->fec_ifcnt == FEC_BUNDLESIZ) {
353 		kprintf("fec%d: can't add new iface; bundle is full\n",
354 		    priv->unit);
355 		return(ENOSPC);
356 	}
357 
358 	/* See if the interface is already in the bundle */
359 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
360 		if (p->fec_if == bifp) {
361 			kprintf("fec%d: iface %s is already in this "
362 			    "bundle\n", priv->unit, iface);
363 			return(EINVAL);
364 		}
365 	}
366 
367 	/* Allocate new list entry. */
368 	MALLOC(new, struct ng_fec_portlist *,
369 	    sizeof(struct ng_fec_portlist), M_NETGRAPH, M_NOWAIT);
370 	if (new == NULL)
371 		return(ENOMEM);
372 
373 	ac = (struct arpcom *)bifp;
374 	ac->ac_netgraph = priv->node;
375 
376 	/*
377 	 * If this is the first interface added to the bundle,
378 	 * use its MAC address for the virtual interface (and,
379 	 * by extension, all the other ports in the bundle).
380 	 */
381 	if (b->fec_ifcnt == 0) {
382 		sdl = IF_LLSOCKADDR(ifp);
383 		bcopy((char *)ac->ac_enaddr,
384 		    priv->arpcom.ac_enaddr, ETHER_ADDR_LEN);
385 		bcopy((char *)ac->ac_enaddr,
386 		    LLADDR(sdl), ETHER_ADDR_LEN);
387 	}
388 
389 	b->fec_btype = FEC_BTYPE_MAC;
390 	new->fec_idx = b->fec_ifcnt;
391 	b->fec_ifcnt++;
392 
393 	/* Save the real MAC address. */
394 	bcopy((char *)ac->ac_enaddr,
395 	    (char *)&new->fec_mac, ETHER_ADDR_LEN);
396 
397 	/* Set up phony MAC address. */
398 	sdl = IF_LLSOCKADDR(bifp);
399 	bcopy(priv->arpcom.ac_enaddr, ac->ac_enaddr, ETHER_ADDR_LEN);
400 	bcopy(priv->arpcom.ac_enaddr, LLADDR(sdl), ETHER_ADDR_LEN);
401 
402 	/* Add to the queue */
403 	new->fec_if = bifp;
404 	TAILQ_INSERT_TAIL(&b->ng_fec_ports, new, fec_list);
405 
406 	return(0);
407 }
408 
409 static int
410 ng_fec_delport(struct ng_fec_private *priv, char *iface)
411 {
412 	struct ng_fec_bundle	*b;
413 	struct ifnet		*ifp, *bifp;
414 	struct arpcom		*ac;
415 	struct sockaddr_dl	*sdl;
416 	struct ng_fec_portlist	*p;
417 
418 	if (priv == NULL || iface == NULL)
419 		return(EINVAL);
420 
421 	b = &priv->fec_bundle;
422 	ifp = &priv->arpcom.ac_if;
423 
424 	/* Find the interface */
425 	bifp = ifunit(iface);
426 	if (bifp == NULL) {
427 		kprintf("fec%d: tried to remove iface %s, which "
428 		    "doesn't seem to exist\n", priv->unit, iface);
429 		return(ENOENT);
430 	}
431 
432 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
433 		if (p->fec_if == bifp)
434 			break;
435 	}
436 
437 	if (p == NULL) {
438 		kprintf("fec%d: tried to remove iface %s which "
439 		    "is not in our bundle\n", priv->unit, iface);
440 		return(EINVAL);
441 	}
442 
443 	/* Stop interface */
444 	bifp->if_flags &= ~IFF_UP;
445 	bifp->if_ioctl(bifp, SIOCSIFFLAGS, NULL, NULL);
446 
447 	/* Restore MAC address. */
448 	ac = (struct arpcom *)bifp;
449 	sdl = IF_LLSOCKADDR(bifp);
450 	bcopy((char *)&p->fec_mac, ac->ac_enaddr, ETHER_ADDR_LEN);
451 	bcopy((char *)&p->fec_mac, LLADDR(sdl), ETHER_ADDR_LEN);
452 
453 	/* Delete port */
454 	TAILQ_REMOVE(&b->ng_fec_ports, p, fec_list);
455 	FREE(p, M_NETGRAPH);
456 	b->fec_ifcnt--;
457 
458 	return(0);
459 }
460 
461 /*
462  * Pass an ioctl command down to all the underyling interfaces in a
463  * bundle. Used for setting multicast filters and flags.
464  */
465 static int
466 ng_fec_setport(struct ifnet *ifp, u_long command, caddr_t data)
467 {
468 	struct ng_fec_private	*priv;
469 	struct ng_fec_bundle	*b;
470 	struct ifnet		*oifp;
471 	struct ng_fec_portlist	*p;
472 
473 	priv = ifp->if_softc;
474 	b = &priv->fec_bundle;
475 
476 	lwkt_serialize_exit(ifp->if_serializer);	/* XXX */
477 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
478 		oifp = p->fec_if;
479 		if (oifp != NULL) {
480 			lwkt_serialize_enter(oifp->if_serializer);
481 			oifp->if_ioctl(oifp, command, data, NULL);
482 			lwkt_serialize_exit(oifp->if_serializer);
483 		}
484 	}
485 	lwkt_serialize_enter(ifp->if_serializer);
486 
487 	return(0);
488 }
489 
490 static void
491 ng_fec_init(void *arg)
492 {
493 	struct ng_fec_private	*priv;
494 	struct ng_fec_bundle	*b;
495 	struct ifnet		*ifp, *bifp;
496 	struct ng_fec_portlist	*p;
497 
498 	ifp = arg;
499 	priv = ifp->if_softc;
500 	b = &priv->fec_bundle;
501 
502 	if (b->fec_ifcnt == 1 || b->fec_ifcnt == 3) {
503 		kprintf("fec%d: invalid bundle "
504 		    "size: %d\n", priv->unit,
505 		    b->fec_ifcnt);
506 		return;
507 	}
508 
509 	ng_fec_stop(ifp);
510 
511 	lwkt_serialize_exit(ifp->if_serializer);	/* XXX */
512 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
513 		bifp = p->fec_if;
514 		lwkt_serialize_enter(bifp->if_serializer);
515 		bifp->if_flags |= IFF_UP;
516                 bifp->if_ioctl(bifp, SIOCSIFFLAGS, NULL, NULL);
517 		/* mark iface as up and let the monitor check it */
518 		p->fec_ifstat = -1;
519 		lwkt_serialize_exit(bifp->if_serializer);
520 	}
521 	lwkt_serialize_enter(ifp->if_serializer);
522 
523 	callout_reset(&priv->fec_timeout, hz, ng_fec_tick, priv);
524 }
525 
526 static void
527 ng_fec_stop(struct ifnet *ifp)
528 {
529 	struct ng_fec_private	*priv;
530 	struct ng_fec_bundle	*b;
531 	struct ifnet		*bifp;
532 	struct ng_fec_portlist	*p;
533 
534 	priv = ifp->if_softc;
535 	b = &priv->fec_bundle;
536 
537 	lwkt_serialize_exit(ifp->if_serializer);	/* XXX */
538 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
539 		bifp = p->fec_if;
540 		lwkt_serialize_enter(bifp->if_serializer);
541 		bifp->if_flags &= ~IFF_UP;
542                 bifp->if_ioctl(bifp, SIOCSIFFLAGS, NULL, NULL);
543 		lwkt_serialize_exit(bifp->if_serializer);
544 	}
545 	callout_stop(&priv->fec_timeout);
546 	lwkt_serialize_enter(ifp->if_serializer);	/* XXX */
547 }
548 
549 static void
550 ng_fec_tick(void *arg)
551 {
552 	struct ng_fec_private	*priv;
553 	struct ng_fec_bundle	*b;
554         struct ifmediareq	ifmr;
555 	struct ifnet		*ifp;
556 	struct ng_fec_portlist	*p;
557 	int			error = 0;
558 
559 	priv = arg;
560 	b = &priv->fec_bundle;
561 
562 	/*
563 	 * Note: serializer for parent interface not held on entry, and
564 	 * cannot be held during the loop to avoid a deadlock.
565 	 */
566 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
567 		bzero((char *)&ifmr, sizeof(ifmr));
568 		ifp = p->fec_if;
569 		lwkt_serialize_enter(ifp->if_serializer);
570 		error = ifp->if_ioctl(ifp, SIOCGIFMEDIA, (caddr_t)&ifmr, NULL);
571 		if (error) {
572 			kprintf("fec%d: failed to check status "
573 			    "of link %s\n", priv->unit, ifp->if_xname);
574 			lwkt_serialize_exit(ifp->if_serializer);
575 			continue;
576 		}
577 
578         	if (ifmr.ifm_status & IFM_AVALID &&
579                     IFM_TYPE(ifmr.ifm_active) == IFM_ETHER) {
580 			if (ifmr.ifm_status & IFM_ACTIVE) {
581 				if (p->fec_ifstat == -1 ||
582 				    p->fec_ifstat == 0) {
583 					p->fec_ifstat = 1;
584 					kprintf("fec%d: port %s in bundle "
585 					    "is up\n", priv->unit,
586 					    ifp->if_xname);
587 				}
588 			} else {
589 				if (p->fec_ifstat == -1 ||
590 				    p->fec_ifstat == 1) {
591 					p->fec_ifstat = 0;
592 					kprintf("fec%d: port %s in bundle "
593 					    "is down\n", priv->unit,
594 					    ifp->if_xname);
595 				}
596 			}
597 		}
598 		lwkt_serialize_exit(ifp->if_serializer);
599 	}
600 
601 	ifp = &priv->arpcom.ac_if;
602 	if (ifp->if_flags & IFF_RUNNING)
603 		callout_reset(&priv->fec_timeout, hz, ng_fec_tick, priv);
604 }
605 
/*
 * Media change callback registered with ifmedia_init().  There is
 * nothing to change on the virtual interface, so this simply reports
 * success.
 */
static int
ng_fec_ifmedia_upd(struct ifnet *ifp)
{
	return (0);
}
611 
612 static void
613 ng_fec_ifmedia_sts(struct ifnet *ifp, struct ifmediareq *ifmr)
614 {
615 	struct ng_fec_private	*priv;
616 	struct ng_fec_bundle	*b;
617 	struct ng_fec_portlist	*p;
618 
619 	priv = ifp->if_softc;
620 	b = &priv->fec_bundle;
621 
622 	ifmr->ifm_status = IFM_AVALID;
623 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
624 		if (p->fec_ifstat) {
625 			ifmr->ifm_status |= IFM_ACTIVE;
626 			break;
627 		}
628 	}
629 }
630 
631 /*
632  * Process an ioctl for the virtual interface
633  */
634 static int
635 ng_fec_ioctl(struct ifnet *ifp, u_long command, caddr_t data, struct ucred *cr)
636 {
637 	struct ifreq *const ifr = (struct ifreq *) data;
638 	int error = 0;
639 	struct ng_fec_private	*priv;
640 	struct ng_fec_bundle	*b;
641 
642 	priv = ifp->if_softc;
643 	b = &priv->fec_bundle;
644 
645 #ifdef DEBUG
646 	ng_fec_print_ioctl(ifp, command, data);
647 #endif
648 	crit_enter();
649 	switch (command) {
650 
651 	/* These two are mostly handled at a higher layer */
652 	case SIOCSIFADDR:
653 	case SIOCGIFADDR:
654 	case SIOCSIFMTU:
655 		error = ether_ioctl(ifp, command, data);
656 		break;
657 
658 	/* Set flags */
659 	case SIOCSIFFLAGS:
660 		/*
661 		 * If the interface is marked up and stopped, then start it.
662 		 * If it is marked down and running, then stop it.
663 		 */
664 		if (ifr->ifr_flags & IFF_UP) {
665 			if (!(ifp->if_flags & IFF_RUNNING)) {
666 				/* Sanity. */
667 				if (b->fec_ifcnt == 1 || b->fec_ifcnt == 3) {
668 					kprintf("fec%d: invalid bundle "
669 					    "size: %d\n", priv->unit,
670 					    b->fec_ifcnt);
671 					error = EINVAL;
672 					break;
673 				}
674 				ifp->if_flags &= ~(IFF_OACTIVE);
675 				ifp->if_flags |= IFF_RUNNING;
676 				ng_fec_init(ifp);
677 			}
678 			/*
679 			 * Bubble down changes in promisc mode to
680 			 * underlying interfaces.
681 			 */
682 			if ((ifp->if_flags & IFF_PROMISC) !=
683 			    (priv->if_flags & IFF_PROMISC)) {
684 				ng_fec_setport(ifp, command, data);
685 				priv->if_flags = ifp->if_flags;
686 			}
687 		} else {
688 			if (ifp->if_flags & IFF_RUNNING)
689 				ifp->if_flags &= ~(IFF_RUNNING | IFF_OACTIVE);
690 			ng_fec_stop(ifp);
691 		}
692 		break;
693 
694 	case SIOCADDMULTI:
695 	case SIOCDELMULTI:
696 		ng_fec_setport(ifp, command, data);
697 		error = 0;
698 		break;
699 	case SIOCGIFMEDIA:
700 	case SIOCSIFMEDIA:
701 		error = ifmedia_ioctl(ifp, ifr, &priv->ifmedia, command);
702 		break;
703 	/* Stuff that's not supported */
704 	case SIOCSIFPHYS:
705 		error = EOPNOTSUPP;
706 		break;
707 
708 	default:
709 		error = EINVAL;
710 		break;
711 	}
712 	crit_exit();
713 	return (error);
714 }
715 
716 /*
717  * This routine spies on mbufs passing through ether_input(). If
718  * they come from one of the interfaces that are aggregated into
719  * our bundle, we fix up the ifnet pointer and increment our
720  * packet counters so that it looks like the frames are actually
721  * coming from us.
722  */
723 static void
724 ng_fec_input(struct ifnet *ifp, struct mbuf **m0)
725 {
726 	struct ng_node		*node;
727 	struct ng_fec_private	*priv;
728 	struct ng_fec_bundle	*b;
729 	struct mbuf		*m;
730 	struct ifnet		*bifp;
731 	struct ng_fec_portlist	*p;
732 
733 	/* Sanity check */
734 	if (ifp == NULL || m0 == NULL)
735 		return;
736 
737 	node = IFP2NG(ifp);
738 
739 	/* Sanity check part II */
740 	if (node == NULL)
741 		return;
742 
743 	priv = node->private;
744 	b = &priv->fec_bundle;
745 	bifp = &priv->arpcom.ac_if;
746 
747 	m = *m0;
748 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
749 		if (p->fec_if == m->m_pkthdr.rcvif)
750 			break;
751 	}
752 
753 	/* Wasn't meant for us; leave this frame alone. */
754 	if (p == NULL)
755 		return;
756 
757 	/* Pretend this is our frame. */
758 	m->m_pkthdr.rcvif = bifp;
759 	bifp->if_ipackets++;
760 	bifp->if_ibytes += m->m_pkthdr.len;
761 
762 	if (bifp->if_bpf)
763 		bpf_mtap(bifp->if_bpf, m);
764 }
765 
766 /*
767  * Take a quick peek at the packet and see if it's ok for us to use
768  * the inet or inet6 hash methods on it, if they're enabled. We do
769  * this by setting flags in the mbuf header. Once we've made up our
770  * mind what to do, we pass the frame to ether_output() for further
771  * processing.
772  */
773 
774 static int
775 ng_fec_output_serialized(struct ifnet *ifp, struct mbuf *m,
776 			 struct sockaddr *dst, struct rtentry *rt0)
777 {
778 	const priv_p priv = (priv_p) ifp->if_softc;
779 	struct ng_fec_bundle *b;
780 	int error;
781 
782 	/* Check interface flags */
783 	if ((ifp->if_flags & (IFF_UP|IFF_RUNNING)) != (IFF_UP|IFF_RUNNING)) {
784 		m_freem(m);
785 		return (ENETDOWN);
786 	}
787 
788 	b = &priv->fec_bundle;
789 
790 	switch (b->fec_btype) {
791 	case FEC_BTYPE_MAC:
792 		m->m_flags |= M_FEC_MAC;
793 		break;
794 #ifdef INET
795 	case FEC_BTYPE_INET:
796 		/*
797 		 * We can't use the INET address port selection
798 		 * scheme if this isn't an INET packet.
799 		 */
800 		if (dst->sa_family == AF_INET)
801 			m->m_flags |= M_FEC_INET;
802 #ifdef INET6
803 		else if (dst->sa_family == AF_INET6)
804 			m->m_flags |= M_FEC_INET6;
805 #endif
806 		else {
807 #ifdef DEBUG
808 			kprintf("%s: can't do inet aggregation of non "
809 			    "inet packet\n", ifp->if_xname);
810 #endif
811 			m->m_flags |= M_FEC_MAC;
812 		}
813 		break;
814 #endif
815 	default:
816 		kprintf("%s: bogus hash type: %d\n", ifp->if_xname,
817 		    b->fec_btype);
818 		m_freem(m);
819 		return(EINVAL);
820 		break;
821 	}
822 
823 	/*
824 	 * Pass the frame to ether_output() for all the protocol
825 	 * handling. This will put the ethernet header on the packet
826 	 * for us.
827 	 */
828 	priv->if_error = 0;
829 	error = priv->real_if_output(ifp, m, dst, rt0);
830 	if (priv->if_error && !error)
831 		error = priv->if_error;
832 
833 	return(error);
834 }
835 
836 static int
837 ng_fec_output(struct ifnet *ifp, struct mbuf *m,
838 	      struct sockaddr *dst, struct rtentry *rt0)
839 {
840 	int error;
841 
842 	lwkt_serialize_enter(ifp->if_serializer);
843 	error = ng_fec_output_serialized(ifp, m, dst, rt0);
844 	lwkt_serialize_exit(ifp->if_serializer);
845 
846 	return error;
847 }
848 
849 /*
850  * Apply a hash to the source and destination addresses in the packet
851  * in order to select an interface. Also check link status and handle
852  * dead links accordingly.
853  */
854 
855 static int
856 ng_fec_choose_port(struct ng_fec_bundle *b,
857 	struct mbuf *m, struct ifnet **ifp)
858 {
859 	struct ether_header	*eh;
860 	struct mbuf		*m0;
861 #ifdef INET
862 	struct ip		*ip;
863 #ifdef INET6
864 	struct ip6_hdr		*ip6;
865 #endif
866 #endif
867 
868 	struct ng_fec_portlist	*p;
869 	int			port = 0, mask;
870 
871 	/*
872 	 * If there are only two ports, mask off all but the
873 	 * last bit for XORing. If there are 4, mask off all
874 	 * but the last 2 bits.
875 	 */
876 	mask = b->fec_ifcnt == 2 ? 0x1 : 0x3;
877 	eh = mtod(m, struct ether_header *);
878 #ifdef INET
879 	ip = (struct ip *)(mtod(m, char *) +
880 	    sizeof(struct ether_header));
881 #ifdef INET6
882 	ip6 = (struct ip6_hdr *)(mtod(m, char *) +
883 	    sizeof(struct ether_header));
884 #endif
885 #endif
886 
887 	/*
888 	 * The fg_fec_output() routine is supposed to leave a
889 	 * flag for us in the mbuf that tells us what hash to
890 	 * use, but sometimes a new mbuf is prepended to the
891 	 * chain, so we have to search every mbuf in the chain
892 	 * to find the flags.
893 	 */
894 	m0 = m;
895 	while (m0) {
896 		if (m0->m_flags & (M_FEC_MAC|M_FEC_INET|M_FEC_INET6))
897 			break;
898 		m0 = m0->m_next;
899 	}
900 	if (m0 == NULL)
901 		return(EINVAL);
902 
903 	switch (m0->m_flags & (M_FEC_MAC|M_FEC_INET|M_FEC_INET6)) {
904 	case M_FEC_MAC:
905 		port = (eh->ether_dhost[5] ^
906 		    eh->ether_shost[5]) & mask;
907 		break;
908 #ifdef INET
909 	case M_FEC_INET:
910 		port = (ntohl(ip->ip_dst.s_addr) ^
911 		    ntohl(ip->ip_src.s_addr)) & mask;
912 		break;
913 #ifdef INET6
914 	case M_FEC_INET6:
915 		port = (ip6->ip6_dst.s6_addr[15] ^
916 		    ip6->ip6_dst.s6_addr[15]) & mask;
917 		break;
918 #endif
919 #endif
920 	default:
921 		return(EINVAL);
922 			break;
923 	}
924 
925 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
926 		if (port == p->fec_idx)
927 			break;
928 	}
929 
930 	/*
931 	 * Now that we've chosen a port, make sure it's
932 	 * alive. If it's not alive, cycle through the bundle
933 	 * looking for a port that is alive. If we don't find
934 	 * any, return an error.
935 	 */
936 	if (p->fec_ifstat != 1) {
937 		struct ng_fec_portlist	*n = NULL;
938 
939 		n = TAILQ_NEXT(p, fec_list);
940 		if (n == NULL)
941 			n = TAILQ_FIRST(&b->ng_fec_ports);
942 		while (n != p) {
943 			if (n->fec_ifstat == 1)
944 				break;
945 			n = TAILQ_NEXT(n, fec_list);
946 			if (n == NULL)
947 				n = TAILQ_FIRST(&b->ng_fec_ports);
948 		}
949 		if (n == p)
950 			return(EAGAIN);
951 		p = n;
952 	}
953 
954 	*ifp = p->fec_if;
955 
956 	return(0);
957 }
958 
959 /*
960  * Now that the packet has been run through ether_output(), yank it
961  * off our own send queue and stick it on the queue for the appropriate
962  * underlying physical interface. Note that if the interface's send
963  * queue is full, we save an error status in our private netgraph
964  * space which will eventually be handed up to ng_fec_output(), which
965  * will return it to the rest of the IP stack. We need to do this
966  * in order to duplicate the effect of ether_output() returning ENOBUFS
967  * when it detects that an interface's send queue is full. There's no
968  * other way to signal the error status from here since the if_start()
969  * routine is spec'ed to return void.
970  *
971  * Once the frame is queued, we call ether_output_frame() to initiate
972  * transmission.
973  */
974 static void
975 ng_fec_start(struct ifnet *ifp)
976 {
977 	struct ng_fec_private	*priv;
978 	struct ng_fec_bundle	*b;
979 	struct ifnet		*oifp = NULL;
980 	struct mbuf		*m0;
981 	int			error;
982 
983 	priv = ifp->if_softc;
984 	b = &priv->fec_bundle;
985 
986 	IF_DEQUEUE(&ifp->if_snd, m0);
987 	if (m0 == NULL)
988 		return;
989 
990 	BPF_MTAP(ifp, m0);
991 
992 	/* Queue up packet on the proper port. */
993 	error = ng_fec_choose_port(b, m0, &oifp);
994 	if (error) {
995 		ifp->if_ierrors++;
996 		m_freem(m0);
997 		priv->if_error = ENOBUFS;
998 		return;
999 	}
1000 	ifp->if_opackets++;
1001 
1002 	/*
1003 	 * Release current iface's serializer to avoid possible dead lock
1004 	 */
1005 	lwkt_serialize_exit(ifp->if_serializer);
1006 	priv->if_error = ether_output_frame(oifp, m0);
1007 	lwkt_serialize_enter(ifp->if_serializer);
1008 }
1009 
1010 #ifdef DEBUG
1011 /*
1012  * Display an ioctl to the virtual interface
1013  */
1014 
1015 static void
1016 ng_fec_print_ioctl(struct ifnet *ifp, int command, caddr_t data)
1017 {
1018 	char   *str;
1019 
1020 	switch (command & IOC_DIRMASK) {
1021 	case IOC_VOID:
1022 		str = "IO";
1023 		break;
1024 	case IOC_OUT:
1025 		str = "IOR";
1026 		break;
1027 	case IOC_IN:
1028 		str = "IOW";
1029 		break;
1030 	case IOC_INOUT:
1031 		str = "IORW";
1032 		break;
1033 	default:
1034 		str = "IO??";
1035 	}
1036 	log(LOG_DEBUG, "%s: %s('%c', %d, char[%d])\n",
1037 	       ifp->if_xname,
1038 	       str,
1039 	       IOCGROUP(command),
1040 	       command & 0xff,
1041 	       IOCPARM_LEN(command));
1042 }
1043 #endif /* DEBUG */
1044 
1045 /************************************************************************
1046 			NETGRAPH NODE STUFF
1047  ************************************************************************/
1048 
1049 /*
1050  * Constructor for a node
1051  */
1052 static int
1053 ng_fec_constructor(node_p *nodep)
1054 {
1055 	char ifname[NG_FEC_FEC_NAME_MAX + 1];
1056 	struct ifnet *ifp;
1057 	node_p node;
1058 	priv_p priv;
1059 	struct ng_fec_bundle *b;
1060 	int error = 0;
1061 
1062 	/* Allocate node and interface private structures */
1063 	MALLOC(priv, priv_p, sizeof(*priv), M_NETGRAPH, M_NOWAIT | M_ZERO);
1064 	if (priv == NULL)
1065 		return (ENOMEM);
1066 
1067 	ifp = &priv->arpcom.ac_if;
1068 	b = &priv->fec_bundle;
1069 
1070 	/* Link them together */
1071 	ifp->if_softc = priv;
1072 
1073 	/* Get an interface unit number */
1074 	if ((error = ng_fec_get_unit(&priv->unit)) != 0) {
1075 		FREE(ifp, M_NETGRAPH);
1076 		FREE(priv, M_NETGRAPH);
1077 		return (error);
1078 	}
1079 
1080 	/* Call generic node constructor */
1081 	if ((error = ng_make_node_common(&typestruct, nodep)) != 0) {
1082 		ng_fec_free_unit(priv->unit);
1083 		FREE(ifp, M_NETGRAPH);
1084 		FREE(priv, M_NETGRAPH);
1085 		return (error);
1086 	}
1087 	node = *nodep;
1088 
1089 	/* Link together node and private info */
1090 	node->private = priv;
1091 	priv->node = node;
1092 	priv->arpcom.ac_netgraph = node;
1093 
1094 	/* Initialize interface structure */
1095 	if_initname(ifp, NG_FEC_FEC_NAME, priv->unit);
1096 	ifp->if_start = ng_fec_start;
1097 	ifp->if_ioctl = ng_fec_ioctl;
1098 	ifp->if_init = ng_fec_init;
1099 	ifp->if_watchdog = NULL;
1100 	ifp->if_snd.ifq_maxlen = IFQ_MAXLEN;
1101 	ifp->if_mtu = NG_FEC_MTU_DEFAULT;
1102 	ifp->if_flags = (IFF_SIMPLEX|IFF_BROADCAST|IFF_MULTICAST);
1103 	ifp->if_type = IFT_PROPVIRTUAL;		/* XXX */
1104 	ifp->if_addrlen = 0;			/* XXX */
1105 	ifp->if_hdrlen = 0;			/* XXX */
1106 	ifp->if_baudrate = 100000000;		/* XXX */
1107 
1108 	/* Give this node the same name as the interface (if possible) */
1109 	bzero(ifname, sizeof(ifname));
1110 	strlcpy(ifname, ifp->if_xname, sizeof(ifname));
1111 	if (ng_name_node(node, ifname) != 0)
1112 		log(LOG_WARNING, "%s: can't acquire netgraph name\n", ifname);
1113 
1114 	/* Grab hold of the ether_input pipe. */
1115 	if (ng_ether_input_p == NULL)
1116 		ng_ether_input_p = ng_fec_input;
1117 
1118 	/* Attach the interface */
1119 	ether_ifattach(ifp, priv->arpcom.ac_enaddr, NULL);
1120 	priv->real_if_output = ifp->if_output;
1121 	ifp->if_output = ng_fec_output;
1122 	callout_init(&priv->fec_timeout);
1123 
1124 	TAILQ_INIT(&b->ng_fec_ports);
1125 	b->fec_ifcnt = 0;
1126 
1127 	ifmedia_init(&priv->ifmedia, 0,
1128 	    ng_fec_ifmedia_upd, ng_fec_ifmedia_sts);
1129 	ifmedia_add(&priv->ifmedia, IFM_ETHER|IFM_NONE, 0, NULL);
1130 	ifmedia_set(&priv->ifmedia, IFM_ETHER|IFM_NONE);
1131 
1132 	/* Done */
1133 	return (0);
1134 }
1135 
1136 /*
1137  * Receive a control message
1138  */
1139 static int
1140 ng_fec_rcvmsg(node_p node, struct ng_mesg *msg,
1141 		const char *retaddr, struct ng_mesg **rptr)
1142 {
1143 	const priv_p priv = node->private;
1144 	struct ng_fec_bundle	*b;
1145 	struct ng_mesg *resp = NULL;
1146 	char *ifname;
1147 	int error = 0;
1148 
1149 	b = &priv->fec_bundle;
1150 
1151 	switch (msg->header.typecookie) {
1152 	case NGM_FEC_COOKIE:
1153 		switch (msg->header.cmd) {
1154 		case NGM_FEC_ADD_IFACE:
1155 			ifname = msg->data;
1156 			error = ng_fec_addport(priv, ifname);
1157 			break;
1158 		case NGM_FEC_DEL_IFACE:
1159 			ifname = msg->data;
1160 			error = ng_fec_delport(priv, ifname);
1161 			break;
1162 		case NGM_FEC_SET_MODE_MAC:
1163 			b->fec_btype = FEC_BTYPE_MAC;
1164 			break;
1165 #ifdef INET
1166 		case NGM_FEC_SET_MODE_INET:
1167 			b->fec_btype = FEC_BTYPE_INET;
1168 			break;
1169 #ifdef INET6
1170 		case NGM_FEC_SET_MODE_INET6:
1171 			b->fec_btype = FEC_BTYPE_INET6;
1172 			break;
1173 #endif
1174 #endif
1175 		default:
1176 			error = EINVAL;
1177 			break;
1178 		}
1179 		break;
1180 	default:
1181 		error = EINVAL;
1182 		break;
1183 	}
1184 	if (rptr)
1185 		*rptr = resp;
1186 	else if (resp)
1187 		FREE(resp, M_NETGRAPH);
1188 	FREE(msg, M_NETGRAPH);
1189 	return (error);
1190 }
1191 
1192 /*
1193  * Shutdown and remove the node and its associated interface.
1194  */
1195 static int
1196 ng_fec_rmnode(node_p node)
1197 {
1198 	const priv_p priv = node->private;
1199 	struct ng_fec_bundle *b;
1200 	struct ng_fec_portlist	*p;
1201 	char ifname[IFNAMSIZ];
1202 
1203 	b = &priv->fec_bundle;
1204 	ng_fec_stop(&priv->arpcom.ac_if);
1205 
1206 	while (!TAILQ_EMPTY(&b->ng_fec_ports)) {
1207 		p = TAILQ_FIRST(&b->ng_fec_ports);
1208 		ksprintf(ifname, "%s",
1209 		    p->fec_if->if_xname); /* XXX: strings */
1210 		ng_fec_delport(priv, ifname);
1211 	}
1212 
1213 	ng_cutlinks(node);
1214 	ng_unname(node);
1215 	if (ng_ether_input_p != NULL)
1216 		ng_ether_input_p = NULL;
1217 	ether_ifdetach(&priv->arpcom.ac_if);
1218 	ifmedia_removeall(&priv->ifmedia);
1219 	ng_fec_free_unit(priv->unit);
1220 	FREE(priv, M_NETGRAPH);
1221 	node->private = NULL;
1222 	ng_unref(node);
1223 	return (0);
1224 }
1225