xref: /dragonfly/sys/netgraph/fec/ng_fec.c (revision a3127495)
1 /*
2  * ng_fec.c
3  *
4  * Copyright (c) 2001 Berkeley Software Design, Inc.
5  * Copyright (c) 2000, 2001
6  *	Bill Paul <wpaul@osd.bsdi.com>.  All rights reserved.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  * 3. All advertising materials mentioning features or use of this software
17  *    must display the following acknowledgement:
18  *	This product includes software developed by Bill Paul.
19  * 4. Neither the name of the author nor the names of any co-contributors
20  *    may be used to endorse or promote products derived from this software
21  *    without specific prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY Bill Paul AND CONTRIBUTORS ``AS IS'' AND
24  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26  * ARE DISCLAIMED.  IN NO EVENT SHALL Bill Paul OR THE VOICES IN HIS HEAD
27  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
28  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
29  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
30  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
31  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
32  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
33  * THE POSSIBILITY OF SUCH DAMAGE.
34  *
35  * $FreeBSD: src/sys/netgraph/ng_fec.c,v 1.1.2.1 2002/11/01 21:39:31 julian Exp $
36  */
37 /*
38  * Copyright (c) 1996-1999 Whistle Communications, Inc.
39  * All rights reserved.
40  *
41  * Subject to the following obligations and disclaimer of warranty, use and
42  * redistribution of this software, in source or object code forms, with or
43  * without modifications are expressly permitted by Whistle Communications;
44  * provided, however, that:
45  * 1. Any and all reproductions of the source or object code must include the
46  *    copyright notice above and the following disclaimer of warranties; and
47  * 2. No rights are granted, in any manner or form, to use Whistle
48  *    Communications, Inc. trademarks, including the mark "WHISTLE
49  *    COMMUNICATIONS" on advertising, endorsements, or otherwise except as
50  *    such appears in the above copyright notice or in the software.
51  *
52  * THIS SOFTWARE IS BEING PROVIDED BY WHISTLE COMMUNICATIONS "AS IS", AND
53  * TO THE MAXIMUM EXTENT PERMITTED BY LAW, WHISTLE COMMUNICATIONS MAKES NO
54  * REPRESENTATIONS OR WARRANTIES, EXPRESS OR IMPLIED, REGARDING THIS SOFTWARE,
55  * INCLUDING WITHOUT LIMITATION, ANY AND ALL IMPLIED WARRANTIES OF
56  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE, OR NON-INFRINGEMENT.
57  * WHISTLE COMMUNICATIONS DOES NOT WARRANT, GUARANTEE, OR MAKE ANY
58  * REPRESENTATIONS REGARDING THE USE OF, OR THE RESULTS OF THE USE OF THIS
59  * SOFTWARE IN TERMS OF ITS CORRECTNESS, ACCURACY, RELIABILITY OR OTHERWISE.
60  * IN NO EVENT SHALL WHISTLE COMMUNICATIONS BE LIABLE FOR ANY DAMAGES
61  * RESULTING FROM OR ARISING OUT OF ANY USE OF THIS SOFTWARE, INCLUDING
62  * WITHOUT LIMITATION, ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY,
63  * PUNITIVE, OR CONSEQUENTIAL DAMAGES, PROCUREMENT OF SUBSTITUTE GOODS OR
64  * SERVICES, LOSS OF USE, DATA OR PROFITS, HOWEVER CAUSED AND UNDER ANY
65  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
66  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
67  * THIS SOFTWARE, EVEN IF WHISTLE COMMUNICATIONS IS ADVISED OF THE POSSIBILITY
68  * OF SUCH DAMAGE.
69  *
70  * Author: Archie Cobbs <archie@freebsd.org>
71  *
72  * $Whistle: ng_fec.c,v 1.33 1999/11/01 09:24:51 julian Exp $
73  */
74 
75 /*
76  * This module implements ethernet channel bonding using the Cisco
77  * Fast EtherChannel mechanism. Two or four ports may be combined
78  * into a single aggregate interface.
79  *
80  * Interfaces are named fec0, fec1, etc.  New nodes take the
81  * first available interface name.
82  *
83  * This node also includes Berkeley packet filter support.
84  *
85  * Note that this node doesn't need to connect to any other
86  * netgraph nodes in order to do its work.
87  */
88 
89 #include <sys/param.h>
90 #include <sys/systm.h>
91 #include <sys/errno.h>
92 #include <sys/kernel.h>
93 #include <sys/malloc.h>
94 #include <sys/mbuf.h>
95 #include <sys/sockio.h>
96 #include <sys/socket.h>
97 #include <sys/syslog.h>
98 #include <sys/libkern.h>
99 #include <sys/queue.h>
100 #include <sys/thread2.h>
101 
102 #include <net/if.h>
103 #include <net/if_types.h>
104 #include <net/if_arp.h>
105 #include <net/if_dl.h>
106 #include <net/if_media.h>
107 #include <net/ifq_var.h>
108 #include <net/bpf.h>
109 #include <net/ethernet.h>
110 
111 #include "opt_inet.h"
112 #include "opt_inet6.h"
113 
114 #include <netinet/in.h>
115 #ifdef INET
116 #include <netinet/in_systm.h>
117 #include <netinet/ip.h>
118 #endif
119 
120 #ifdef INET6
121 #include <netinet/ip6.h>
122 #endif
123 
124 #include <netgraph/ng_message.h>
125 #include <netgraph/netgraph.h>
126 #include <netgraph/ng_parse.h>
127 #include "ng_fec.h"
128 
/* Fetch the netgraph node pointer stored in an interface's arpcom. */
#define IFP2NG(ifp)  ((struct ng_node *)((struct arpcom *)(ifp))->ac_netgraph)

/*
 * Advance x by one, wrapping back to zero at y.  Every argument and the
 * whole expansion are parenthesized so that compound arguments such as
 * FEC_INC(v, a + b) behave as written.  x is evaluated twice, so it
 * must not have side effects.
 */
#define FEC_INC(x, y)	((x) = ((x) + 1) % (y))

/*
 * Current fast etherchannel implementations use either 2 or 4
 * ports, so for now we limit the maximum bundle size to 4 interfaces.
 */
#define FEC_BUNDLESIZ	4
137 
/* One member port of a bundle. */
138 struct ng_fec_portlist {
139 	struct ifnet		*fec_if;	/* underlying interface */
140 	int			fec_idx;	/* slot index, assigned when the port is added */
141 	int			fec_ifstat;	/* link state: 1 up, 0 down, -1 not yet polled */
142 	struct ether_addr	fec_mac;	/* port's own MAC, saved so removal can restore it */
143 	TAILQ_ENTRY(ng_fec_portlist) fec_list;	/* linkage on the bundle's port list */
144 };
145 
/* The set of ports aggregated behind one fec interface. */
146 struct ng_fec_bundle {
147 	TAILQ_HEAD(,ng_fec_portlist) ng_fec_ports;	/* member ports, appended in the order added */
148 	int			fec_ifcnt;	/* number of ports in the bundle */
149 	int			fec_btype;	/* hash selection, one of FEC_BTYPE_* */
150 };
151 
/*
 * Values for fec_btype.  The output path handles MAC and (with INET
 * compiled in) INET; NOTE(review): no visible code handles
 * FEC_BTYPE_INET6 as a bundle type -- confirm whether it is ever set.
 */
152 #define FEC_BTYPE_MAC		0x01
153 #define FEC_BTYPE_INET		0x02
154 #define FEC_BTYPE_INET6		0x03
155 
156 /* Node private data */
157 struct ng_fec_private {
158 	struct arpcom arpcom;		/* the virtual interface; its ac_if is our ifnet */
159 	struct ifmedia ifmedia;		/* media state used for SIOCGIFMEDIA/SIOCSIFMEDIA */
160 	int	if_flags;		/* copy of if_flags taken at the last promisc push-down */
161 	int	if_error;		/* XXX error set by ng_fec_start() and picked up by the output path */
162 	int	unit;			/* Interface unit number */
163 	node_p	node;			/* Our netgraph node */
164 	struct ng_fec_bundle fec_bundle;/* Aggregate bundle */
165 	struct callout fec_timeout;	/* callout for ticker */
	/* if_output saved by the constructor before it installs ng_fec_output() */
166 	int	(*real_if_output)(struct ifnet *, struct mbuf *,
167 				  struct sockaddr *, struct rtentry *);
168 };
169 typedef struct ng_fec_private *priv_p;
170 
171 /* Interface methods */
172 static void	ng_fec_input(struct ifnet *, struct mbuf **);
173 static void	ng_fec_start(struct ifnet *ifp, struct ifaltq_subque *);
174 static int	ng_fec_choose_port(struct ng_fec_bundle *b,
175 			struct mbuf *m, struct ifnet **ifp);
176 static int	ng_fec_setport(struct ifnet *ifp, u_long cmd, caddr_t data);
177 static void	ng_fec_init(void *arg);
178 static void	ng_fec_stop(struct ifnet *ifp);
179 static int	ng_fec_ifmedia_upd(struct ifnet *ifp);
180 static void	ng_fec_ifmedia_sts(struct ifnet *ifp, struct ifmediareq *ifmr);
181 static int	ng_fec_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data,
182 			     struct ucred *);
183 static int	ng_fec_output(struct ifnet *ifp, struct mbuf *m0,
184 			struct sockaddr *dst, struct rtentry *rt0);
185 static void	ng_fec_tick(void *arg);
186 static int	ng_fec_addport(struct ng_fec_private *priv, char *iface);
187 static int	ng_fec_delport(struct ng_fec_private *priv, char *iface);
188 
189 #ifdef DEBUG
190 static void	ng_fec_print_ioctl(struct ifnet *ifp, int cmd, caddr_t data);
191 #endif
192 
193 /* Netgraph methods */
194 static ng_constructor_t	ng_fec_constructor;
195 static ng_rcvmsg_t	ng_fec_rcvmsg;
196 static ng_shutdown_t	ng_fec_rmnode;
197 
198 /* List of commands and how to convert arguments to/from ASCII */
199 static const struct ng_cmdlist ng_fec_cmds[] = {
200 	{
201 	  NGM_FEC_COOKIE,
202 	  NGM_FEC_ADD_IFACE,
203 	  "add_iface",
204 	  &ng_parse_string_type,	/* string argument; presumably the interface name -- confirm in rcvmsg */
205 	  NULL,
206 	},
207 	{
208 	  NGM_FEC_COOKIE,
209 	  NGM_FEC_DEL_IFACE,
210 	  "del_iface",
211 	  &ng_parse_string_type,	/* string argument; presumably the interface name -- confirm in rcvmsg */
212 	  NULL,
213 	},
214 	{
215 	  NGM_FEC_COOKIE,
216 	  NGM_FEC_SET_MODE_MAC,
217 	  "set_mode_mac",
218 	  NULL,				/* no parse types given for this command */
219 	  NULL,
220 	},
221 	{
222 	  NGM_FEC_COOKIE,
223 	  NGM_FEC_SET_MODE_INET,
224 	  "set_mode_inet",
225 	  NULL,				/* no parse types given for this command */
226 	  NULL,
227 	},
228 	{ 0 }				/* zeroed entry terminates the list */
229 };
230 
231 /* Node type descriptor */
232 static struct ng_type typestruct = {
233 	NG_VERSION,
234 	NG_FEC_NODE_TYPE,
235 	NULL,
236 	ng_fec_constructor,	/* node constructor */
237 	ng_fec_rcvmsg,		/* control message handler */
238 	ng_fec_rmnode,		/* node shutdown */
239 	NULL,			/* the remaining method slots are left empty */
240 	NULL,
241 	NULL,
242 	NULL,
243 	NULL,
244 	NULL,
245 	ng_fec_cmds		/* command list used for ASCII conversion */
246 };
247 NETGRAPH_INIT(fec, &typestruct);
248 
249 /* We keep a bitmap indicating which unit numbers are free.
250    One means the unit number is free, zero means it's taken. */
251 static int	*ng_fec_units = NULL;	/* bitmap words; NULL until ng_fec_get_unit() first allocates */
252 static int	ng_fec_units_len = 0;	/* number of words in ng_fec_units */
253 static int	ng_units_in_use = 0;	/* bumped by ng_fec_get_unit(); bitmap is freed when it reads zero */
254 
255 #define UNITS_BITSPERWORD	(sizeof(*ng_fec_units) * NBBY)	/* unit numbers covered by one bitmap word */
256 
257 /*
258  * Find the first free unit number for a new interface.
259  * Increase the size of the unit bitmap as necessary.
260  */
261 static __inline__ int
262 ng_fec_get_unit(int *unit)
263 {
264 	int index, bit;
265 
266 	for (index = 0; index < ng_fec_units_len
267 	    && ng_fec_units[index] == 0; index++);
268 	if (index == ng_fec_units_len) {		/* extend array */
269 		int i, *newarray, newlen;
270 
271 		newlen = (2 * ng_fec_units_len) + 4;
272 		newarray = kmalloc(newlen * sizeof(*ng_fec_units),
273 				   M_NETGRAPH, M_NOWAIT);
274 		if (newarray == NULL)
275 			return (ENOMEM);
276 		bcopy(ng_fec_units, newarray,
277 		    ng_fec_units_len * sizeof(*ng_fec_units));
278 		for (i = ng_fec_units_len; i < newlen; i++)
279 			newarray[i] = ~0;
280 		if (ng_fec_units != NULL)
281 			kfree(ng_fec_units, M_NETGRAPH);
282 		ng_fec_units = newarray;
283 		ng_fec_units_len = newlen;
284 	}
285 	bit = ffs(ng_fec_units[index]) - 1;
286 	KASSERT(bit >= 0 && bit <= UNITS_BITSPERWORD - 1,
287 	    ("%s: word=%d bit=%d", __func__, ng_fec_units[index], bit));
288 	ng_fec_units[index] &= ~(1 << bit);
289 	*unit = (index * UNITS_BITSPERWORD) + bit;
290 	ng_units_in_use++;
291 	return (0);
292 }
293 
294 /*
295  * Free a no longer needed unit number.
296  */
297 static __inline__ void
298 ng_fec_free_unit(int unit)
299 {
300 	int index, bit;
301 
302 	index = unit / UNITS_BITSPERWORD;
303 	bit = unit % UNITS_BITSPERWORD;
304 	KASSERT(index < ng_fec_units_len,
305 	    ("%s: unit=%d len=%d", __func__, unit, ng_fec_units_len));
306 	KASSERT((ng_fec_units[index] & (1 << bit)) == 0,
307 	    ("%s: unit=%d is free", __func__, unit));
308 	ng_fec_units[index] |= (1 << bit);
309 	/*
310 	 * XXX We could think about reducing the size of ng_fec_units[]
311 	 * XXX here if the last portion is all ones
312 	 * XXX At least free it if no more units.
313 	 * Needed if we are eventually be able to unload.
314 	 */
315 	ng_units_in_use++;
316 	if (ng_units_in_use == 0) { /* XXX make SMP safe */
317 		kfree(ng_fec_units, M_NETGRAPH);
318 		ng_fec_units_len = 0;
319 		ng_fec_units = NULL;
320 	}
321 }
322 
323 /************************************************************************
324 			INTERFACE STUFF
325  ************************************************************************/
326 
327 static int
328 ng_fec_addport(struct ng_fec_private *priv, char *iface)
329 {
330 	struct ng_fec_bundle	*b;
331 	struct ifnet		*ifp, *bifp;
332 	struct arpcom		*ac;
333 	struct sockaddr_dl	*sdl;
334 	struct ng_fec_portlist	*p, *new;
335 
336 	if (priv == NULL || iface == NULL)
337 		return(EINVAL);
338 
339 	b = &priv->fec_bundle;
340 	ifp = &priv->arpcom.ac_if;
341 
342 	ifnet_lock();
343 
344 	/* Find the interface */
345 	bifp = ifunit(iface);
346 	if (bifp == NULL) {
347 		ifnet_unlock();
348 		kprintf("fec%d: tried to add iface %s, which "
349 		    "doesn't seem to exist\n", priv->unit, iface);
350 		return(ENOENT);
351 	}
352 
353 	/* See if we have room in the bundle */
354 	if (b->fec_ifcnt == FEC_BUNDLESIZ) {
355 		ifnet_unlock();
356 		kprintf("fec%d: can't add new iface; bundle is full\n",
357 		    priv->unit);
358 		return(ENOSPC);
359 	}
360 
361 	/* See if the interface is already in the bundle */
362 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
363 		if (p->fec_if == bifp) {
364 			ifnet_unlock();
365 			kprintf("fec%d: iface %s is already in this "
366 			    "bundle\n", priv->unit, iface);
367 			return(EINVAL);
368 		}
369 	}
370 
371 	/* Allocate new list entry. */
372 	new = kmalloc(sizeof(struct ng_fec_portlist), M_NETGRAPH, M_NOWAIT);
373 	if (new == NULL) {
374 		ifnet_unlock();
375 		return(ENOMEM);
376 	}
377 
378 	ac = (struct arpcom *)bifp;
379 	ac->ac_netgraph = priv->node;
380 
381 	/*
382 	 * If this is the first interface added to the bundle,
383 	 * use its MAC address for the virtual interface (and,
384 	 * by extension, all the other ports in the bundle).
385 	 */
386 	if (b->fec_ifcnt == 0) {
387 		sdl = IF_LLSOCKADDR(ifp);
388 		bcopy((char *)ac->ac_enaddr,
389 		    priv->arpcom.ac_enaddr, ETHER_ADDR_LEN);
390 		bcopy((char *)ac->ac_enaddr,
391 		    LLADDR(sdl), ETHER_ADDR_LEN);
392 	}
393 
394 	b->fec_btype = FEC_BTYPE_MAC;
395 	new->fec_idx = b->fec_ifcnt;
396 	b->fec_ifcnt++;
397 
398 	/* Save the real MAC address. */
399 	bcopy((char *)ac->ac_enaddr,
400 	    (char *)&new->fec_mac, ETHER_ADDR_LEN);
401 
402 	/* Set up phony MAC address. */
403 	sdl = IF_LLSOCKADDR(bifp);
404 	bcopy(priv->arpcom.ac_enaddr, ac->ac_enaddr, ETHER_ADDR_LEN);
405 	bcopy(priv->arpcom.ac_enaddr, LLADDR(sdl), ETHER_ADDR_LEN);
406 
407 	/* Add to the queue */
408 	new->fec_if = bifp;
409 	TAILQ_INSERT_TAIL(&b->ng_fec_ports, new, fec_list);
410 
411 	ifnet_unlock();
412 
413 	return(0);
414 }
415 
416 static int
417 ng_fec_delport(struct ng_fec_private *priv, char *iface)
418 {
419 	struct ng_fec_bundle	*b;
420 	struct ifnet		*bifp;
421 	struct arpcom		*ac;
422 	struct sockaddr_dl	*sdl;
423 	struct ng_fec_portlist	*p;
424 
425 	if (priv == NULL || iface == NULL)
426 		return(EINVAL);
427 
428 	b = &priv->fec_bundle;
429 
430 	ifnet_lock();
431 
432 	/* Find the interface */
433 	bifp = ifunit(iface);
434 	if (bifp == NULL) {
435 		ifnet_unlock();
436 		kprintf("fec%d: tried to remove iface %s, which "
437 		    "doesn't seem to exist\n", priv->unit, iface);
438 		return(ENOENT);
439 	}
440 
441 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
442 		if (p->fec_if == bifp)
443 			break;
444 	}
445 
446 	if (p == NULL) {
447 		ifnet_unlock();
448 		kprintf("fec%d: tried to remove iface %s which "
449 		    "is not in our bundle\n", priv->unit, iface);
450 		return(EINVAL);
451 	}
452 
453 	/* Stop interface */
454 	bifp->if_flags &= ~IFF_UP;
455 	bifp->if_ioctl(bifp, SIOCSIFFLAGS, NULL, NULL);
456 
457 	/* Restore MAC address. */
458 	ac = (struct arpcom *)bifp;
459 	sdl = IF_LLSOCKADDR(bifp);
460 	bcopy((char *)&p->fec_mac, ac->ac_enaddr, ETHER_ADDR_LEN);
461 	bcopy((char *)&p->fec_mac, LLADDR(sdl), ETHER_ADDR_LEN);
462 
463 	/* Delete port */
464 	TAILQ_REMOVE(&b->ng_fec_ports, p, fec_list);
465 	kfree(p, M_NETGRAPH);
466 	b->fec_ifcnt--;
467 
468 	ifnet_unlock();
469 
470 	return(0);
471 }
472 
473 /*
474  * Pass an ioctl command down to all the underyling interfaces in a
475  * bundle. Used for setting multicast filters and flags.
476  */
477 static int
478 ng_fec_setport(struct ifnet *ifp, u_long command, caddr_t data)
479 {
480 	struct ng_fec_private	*priv;
481 	struct ng_fec_bundle	*b;
482 	struct ifnet		*oifp;
483 	struct ng_fec_portlist	*p;
484 
485 	priv = ifp->if_softc;
486 	b = &priv->fec_bundle;
487 
488 	ifnet_deserialize_all(ifp);	/* XXX */
489 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
490 		oifp = p->fec_if;
491 		if (oifp != NULL) {
492 			ifnet_serialize_all(oifp);
493 			oifp->if_ioctl(oifp, command, data, NULL);
494 			ifnet_deserialize_all(oifp);
495 		}
496 	}
497 	ifnet_serialize_all(ifp);
498 
499 	return(0);
500 }
501 
502 static void
503 ng_fec_init(void *arg)
504 {
505 	struct ng_fec_private	*priv;
506 	struct ng_fec_bundle	*b;
507 	struct ifnet		*ifp, *bifp;
508 	struct ng_fec_portlist	*p;
509 
510 	ifp = arg;
511 	priv = ifp->if_softc;
512 	b = &priv->fec_bundle;
513 
514 	if (b->fec_ifcnt == 1 || b->fec_ifcnt == 3) {
515 		kprintf("fec%d: invalid bundle "
516 		    "size: %d\n", priv->unit,
517 		    b->fec_ifcnt);
518 		return;
519 	}
520 
521 	ng_fec_stop(ifp);
522 
523 	ifnet_deserialize_all(ifp);	/* XXX */
524 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
525 		bifp = p->fec_if;
526 		ifnet_serialize_all(bifp);
527 		bifp->if_flags |= IFF_UP;
528                 bifp->if_ioctl(bifp, SIOCSIFFLAGS, NULL, NULL);
529 		/* mark iface as up and let the monitor check it */
530 		p->fec_ifstat = -1;
531 		ifnet_deserialize_all(bifp);
532 	}
533 	ifnet_serialize_all(ifp);
534 
535 	callout_reset(&priv->fec_timeout, hz, ng_fec_tick, priv);
536 }
537 
538 static void
539 ng_fec_stop(struct ifnet *ifp)
540 {
541 	struct ng_fec_private	*priv;
542 	struct ng_fec_bundle	*b;
543 	struct ifnet		*bifp;
544 	struct ng_fec_portlist	*p;
545 
546 	priv = ifp->if_softc;
547 	b = &priv->fec_bundle;
548 
549 	ifnet_deserialize_all(ifp);	/* XXX */
550 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
551 		bifp = p->fec_if;
552 		ifnet_serialize_all(bifp);
553 		bifp->if_flags &= ~IFF_UP;
554                 bifp->if_ioctl(bifp, SIOCSIFFLAGS, NULL, NULL);
555 		ifnet_deserialize_all(bifp);
556 	}
557 	ifnet_serialize_all(ifp);
558 
559 	callout_stop(&priv->fec_timeout);
560 }
561 
562 static void
563 ng_fec_tick(void *arg)
564 {
565 	struct ng_fec_private	*priv;
566 	struct ng_fec_bundle	*b;
567         struct ifmediareq	ifmr;
568 	struct ifnet		*ifp;
569 	struct ng_fec_portlist	*p;
570 	int			error = 0;
571 
572 	priv = arg;
573 	b = &priv->fec_bundle;
574 
575 	/*
576 	 * Note: serializer for parent interface not held on entry, and
577 	 * cannot be held during the loop to avoid a deadlock.
578 	 */
579 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
580 		bzero((char *)&ifmr, sizeof(ifmr));
581 		ifp = p->fec_if;
582 		ifnet_serialize_all(ifp);
583 		error = ifp->if_ioctl(ifp, SIOCGIFMEDIA, (caddr_t)&ifmr, NULL);
584 		if (error) {
585 			kprintf("fec%d: failed to check status "
586 			    "of link %s\n", priv->unit, ifp->if_xname);
587 			ifnet_deserialize_all(ifp);
588 			continue;
589 		}
590 
591         	if (ifmr.ifm_status & IFM_AVALID &&
592                     IFM_TYPE(ifmr.ifm_active) == IFM_ETHER) {
593 			if (ifmr.ifm_status & IFM_ACTIVE) {
594 				if (p->fec_ifstat == -1 ||
595 				    p->fec_ifstat == 0) {
596 					p->fec_ifstat = 1;
597 					kprintf("fec%d: port %s in bundle "
598 					    "is up\n", priv->unit,
599 					    ifp->if_xname);
600 				}
601 			} else {
602 				if (p->fec_ifstat == -1 ||
603 				    p->fec_ifstat == 1) {
604 					p->fec_ifstat = 0;
605 					kprintf("fec%d: port %s in bundle "
606 					    "is down\n", priv->unit,
607 					    ifp->if_xname);
608 				}
609 			}
610 		}
611 		ifnet_deserialize_all(ifp);
612 	}
613 
614 	ifp = &priv->arpcom.ac_if;
615 	if (ifp->if_flags & IFF_RUNNING)
616 		callout_reset(&priv->fec_timeout, hz, ng_fec_tick, priv);
617 }
618 
/*
 * Media change callback for the virtual interface.  Nothing is
 * changed; the request is always reported as successful.
 */
static int
ng_fec_ifmedia_upd(struct ifnet *ifp)
{
	return (0);
}
624 
625 static void
626 ng_fec_ifmedia_sts(struct ifnet *ifp, struct ifmediareq *ifmr)
627 {
628 	struct ng_fec_private	*priv;
629 	struct ng_fec_bundle	*b;
630 	struct ng_fec_portlist	*p;
631 
632 	priv = ifp->if_softc;
633 	b = &priv->fec_bundle;
634 
635 	ifmr->ifm_status = IFM_AVALID;
636 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
637 		if (p->fec_ifstat) {
638 			ifmr->ifm_status |= IFM_ACTIVE;
639 			break;
640 		}
641 	}
642 }
643 
644 /*
645  * Process an ioctl for the virtual interface
646  */
647 static int
648 ng_fec_ioctl(struct ifnet *ifp, u_long command, caddr_t data, struct ucred *cr)
649 {
650 	struct ifreq *const ifr = (struct ifreq *) data;
651 	int error = 0;
652 	struct ng_fec_private	*priv;
653 	struct ng_fec_bundle	*b;
654 
655 	priv = ifp->if_softc;
656 	b = &priv->fec_bundle;
657 
658 #ifdef DEBUG
659 	ng_fec_print_ioctl(ifp, command, data);
660 #endif
661 	crit_enter();
662 	switch (command) {
663 
664 	/* These two are mostly handled at a higher layer */
665 	case SIOCSIFADDR:
666 	case SIOCGIFADDR:
667 	case SIOCSIFMTU:
668 		error = ether_ioctl(ifp, command, data);
669 		break;
670 
671 	/* Set flags */
672 	case SIOCSIFFLAGS:
673 		/*
674 		 * If the interface is marked up and stopped, then start it.
675 		 * If it is marked down and running, then stop it.
676 		 */
677 		if (ifr->ifr_flags & IFF_UP) {
678 			if (!(ifp->if_flags & IFF_RUNNING)) {
679 				/* Sanity. */
680 				if (b->fec_ifcnt == 1 || b->fec_ifcnt == 3) {
681 					kprintf("fec%d: invalid bundle "
682 					    "size: %d\n", priv->unit,
683 					    b->fec_ifcnt);
684 					error = EINVAL;
685 					break;
686 				}
687 				ifq_clr_oactive(&ifp->if_snd);
688 				ifp->if_flags |= IFF_RUNNING;
689 				ng_fec_init(ifp);
690 			}
691 			/*
692 			 * Bubble down changes in promisc mode to
693 			 * underlying interfaces.
694 			 */
695 			if ((ifp->if_flags & IFF_PROMISC) !=
696 			    (priv->if_flags & IFF_PROMISC)) {
697 				ng_fec_setport(ifp, command, data);
698 				priv->if_flags = ifp->if_flags;
699 			}
700 		} else {
701 			if (ifp->if_flags & IFF_RUNNING) {
702 				ifp->if_flags &= ~IFF_RUNNING;
703 				ifq_clr_oactive(&ifp->if_snd);
704 			}
705 			ng_fec_stop(ifp);
706 		}
707 		break;
708 
709 	case SIOCADDMULTI:
710 	case SIOCDELMULTI:
711 		ng_fec_setport(ifp, command, data);
712 		error = 0;
713 		break;
714 	case SIOCGIFMEDIA:
715 	case SIOCSIFMEDIA:
716 		error = ifmedia_ioctl(ifp, ifr, &priv->ifmedia, command);
717 		break;
718 	/* Stuff that's not supported */
719 	case SIOCSIFPHYS:
720 		error = EOPNOTSUPP;
721 		break;
722 
723 	default:
724 		error = EINVAL;
725 		break;
726 	}
727 	crit_exit();
728 	return (error);
729 }
730 
731 /*
732  * This routine spies on mbufs passing through ether_input(). If
733  * they come from one of the interfaces that are aggregated into
734  * our bundle, we fix up the ifnet pointer and increment our
735  * packet counters so that it looks like the frames are actually
736  * coming from us.
737  */
738 static void
739 ng_fec_input(struct ifnet *ifp, struct mbuf **m0)
740 {
741 	struct ng_node		*node;
742 	struct ng_fec_private	*priv;
743 	struct ng_fec_bundle	*b;
744 	struct mbuf		*m;
745 	struct ifnet		*bifp;
746 	struct ng_fec_portlist	*p;
747 
748 	/* Sanity check */
749 	if (ifp == NULL || m0 == NULL)
750 		return;
751 
752 	node = IFP2NG(ifp);
753 
754 	/* Sanity check part II */
755 	if (node == NULL)
756 		return;
757 
758 	priv = node->private;
759 	b = &priv->fec_bundle;
760 	bifp = &priv->arpcom.ac_if;
761 
762 	m = *m0;
763 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
764 		if (p->fec_if == m->m_pkthdr.rcvif)
765 			break;
766 	}
767 
768 	/* Wasn't meant for us; leave this frame alone. */
769 	if (p == NULL)
770 		return;
771 
772 	/* Pretend this is our frame. */
773 	m->m_pkthdr.rcvif = bifp;
774 	IFNET_STAT_INC(bifp, ipackets, 1);
775 	IFNET_STAT_INC(bifp, ibytes, m->m_pkthdr.len);
776 
777 	if (bifp->if_bpf) {
778 		bpf_gettoken();
779 		if (bifp->if_bpf)
780 			bpf_mtap(bifp->if_bpf, m);
781 		bpf_reltoken();
782 	}
783 }
784 
785 /*
786  * Take a quick peek at the packet and see if it's ok for us to use
787  * the inet or inet6 hash methods on it, if they're enabled. We do
788  * this by setting flags in the mbuf header. Once we've made up our
789  * mind what to do, we pass the frame to ether_output() for further
790  * processing.
791  */
792 
793 static int
794 ng_fec_output_serialized(struct ifnet *ifp, struct mbuf *m,
795 			 struct sockaddr *dst, struct rtentry *rt0)
796 {
797 	const priv_p priv = (priv_p) ifp->if_softc;
798 	struct ng_fec_bundle *b;
799 	int error;
800 
801 	/* Check interface flags */
802 	if ((ifp->if_flags & (IFF_UP|IFF_RUNNING)) != (IFF_UP|IFF_RUNNING)) {
803 		m_freem(m);
804 		return (ENETDOWN);
805 	}
806 
807 	b = &priv->fec_bundle;
808 
809 	switch (b->fec_btype) {
810 	case FEC_BTYPE_MAC:
811 		m->m_flags |= M_FEC_MAC;
812 		break;
813 #ifdef INET
814 	case FEC_BTYPE_INET:
815 		/*
816 		 * We can't use the INET address port selection
817 		 * scheme if this isn't an INET packet.
818 		 */
819 		if (dst->sa_family == AF_INET)
820 			m->m_flags |= M_FEC_INET;
821 #ifdef INET6
822 		else if (dst->sa_family == AF_INET6)
823 			m->m_flags |= M_FEC_INET6;
824 #endif
825 		else {
826 #ifdef DEBUG
827 			kprintf("%s: can't do inet aggregation of non "
828 			    "inet packet\n", ifp->if_xname);
829 #endif
830 			m->m_flags |= M_FEC_MAC;
831 		}
832 		break;
833 #endif
834 	default:
835 		kprintf("%s: bogus hash type: %d\n", ifp->if_xname,
836 		    b->fec_btype);
837 		m_freem(m);
838 		return(EINVAL);
839 		break;
840 	}
841 
842 	/*
843 	 * Pass the frame to ether_output() for all the protocol
844 	 * handling. This will put the ethernet header on the packet
845 	 * for us.
846 	 */
847 	priv->if_error = 0;
848 	error = priv->real_if_output(ifp, m, dst, rt0);
849 	if (priv->if_error && !error)
850 		error = priv->if_error;
851 
852 	return(error);
853 }
854 
855 static int
856 ng_fec_output(struct ifnet *ifp, struct mbuf *m,
857 	      struct sockaddr *dst, struct rtentry *rt0)
858 {
859 	struct ifaltq_subque *ifsq = ifq_get_subq_default(&ifp->if_snd);
860 	int error;
861 
862 	ifsq_serialize_hw(ifsq);
863 	error = ng_fec_output_serialized(ifp, m, dst, rt0);
864 	ifsq_deserialize_hw(ifsq);
865 
866 	return error;
867 }
868 
869 /*
870  * Apply a hash to the source and destination addresses in the packet
871  * in order to select an interface. Also check link status and handle
872  * dead links accordingly.
873  */
874 
875 static int
876 ng_fec_choose_port(struct ng_fec_bundle *b,
877 	struct mbuf *m, struct ifnet **ifp)
878 {
879 	struct ether_header	*eh;
880 	struct mbuf		*m0;
881 #ifdef INET
882 	struct ip		*ip;
883 #ifdef INET6
884 	struct ip6_hdr		*ip6;
885 #endif
886 #endif
887 
888 	struct ng_fec_portlist	*p;
889 	int			port = 0, mask;
890 
891 	/*
892 	 * If there are only two ports, mask off all but the
893 	 * last bit for XORing. If there are 4, mask off all
894 	 * but the last 2 bits.
895 	 */
896 	mask = b->fec_ifcnt == 2 ? 0x1 : 0x3;
897 	eh = mtod(m, struct ether_header *);
898 #ifdef INET
899 	ip = (struct ip *)(mtod(m, char *) +
900 	    sizeof(struct ether_header));
901 #ifdef INET6
902 	ip6 = (struct ip6_hdr *)(mtod(m, char *) +
903 	    sizeof(struct ether_header));
904 #endif
905 #endif
906 
907 	/*
908 	 * The fg_fec_output() routine is supposed to leave a
909 	 * flag for us in the mbuf that tells us what hash to
910 	 * use, but sometimes a new mbuf is prepended to the
911 	 * chain, so we have to search every mbuf in the chain
912 	 * to find the flags.
913 	 */
914 	m0 = m;
915 	while (m0) {
916 		if (m0->m_flags & (M_FEC_MAC|M_FEC_INET|M_FEC_INET6))
917 			break;
918 		m0 = m0->m_next;
919 	}
920 	if (m0 == NULL)
921 		return(EINVAL);
922 
923 	switch (m0->m_flags & (M_FEC_MAC|M_FEC_INET|M_FEC_INET6)) {
924 	case M_FEC_MAC:
925 		port = (eh->ether_dhost[5] ^
926 		    eh->ether_shost[5]) & mask;
927 		break;
928 #ifdef INET
929 	case M_FEC_INET:
930 		port = (ntohl(ip->ip_dst.s_addr) ^
931 		    ntohl(ip->ip_src.s_addr)) & mask;
932 		break;
933 #ifdef INET6
934 	case M_FEC_INET6:
935 		port = (ip6->ip6_dst.s6_addr[15] ^
936 		    ip6->ip6_src.s6_addr[15]) & mask;
937 		break;
938 #endif
939 #endif
940 	default:
941 		return(EINVAL);
942 			break;
943 	}
944 
945 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
946 		if (port == p->fec_idx)
947 			break;
948 	}
949 
950 	/*
951 	 * Now that we've chosen a port, make sure it's
952 	 * alive. If it's not alive, cycle through the bundle
953 	 * looking for a port that is alive. If we don't find
954 	 * any, return an error.
955 	 */
956 	if (p->fec_ifstat != 1) {
957 		struct ng_fec_portlist	*n = NULL;
958 
959 		n = TAILQ_NEXT(p, fec_list);
960 		if (n == NULL)
961 			n = TAILQ_FIRST(&b->ng_fec_ports);
962 		while (n != p) {
963 			if (n->fec_ifstat == 1)
964 				break;
965 			n = TAILQ_NEXT(n, fec_list);
966 			if (n == NULL)
967 				n = TAILQ_FIRST(&b->ng_fec_ports);
968 		}
969 		if (n == p)
970 			return(EAGAIN);
971 		p = n;
972 	}
973 
974 	*ifp = p->fec_if;
975 
976 	return(0);
977 }
978 
979 /*
980  * Now that the packet has been run through ether_output(), yank it
981  * off our own send queue and stick it on the queue for the appropriate
982  * underlying physical interface. Note that if the interface's send
983  * queue is full, we save an error status in our private netgraph
984  * space which will eventually be handed up to ng_fec_output(), which
985  * will return it to the rest of the IP stack. We need to do this
986  * in order to duplicate the effect of ether_output() returning ENOBUFS
987  * when it detects that an interface's send queue is full. There's no
988  * other way to signal the error status from here since the if_start()
989  * routine is spec'ed to return void.
990  *
991  * Once the frame is queued, we call ether_output_frame() to initiate
992  * transmission.
993  */
994 static void
995 ng_fec_start(struct ifnet *ifp, struct ifaltq_subque *ifsq __unused)
996 {
997 	struct ng_fec_private	*priv;
998 	struct ng_fec_bundle	*b;
999 	struct ifnet		*oifp = NULL;
1000 	struct mbuf		*m0;
1001 	int			error;
1002 
1003 	priv = ifp->if_softc;
1004 	b = &priv->fec_bundle;
1005 
1006 	m0 = ifq_dequeue(&ifp->if_snd);
1007 	if (m0 == NULL)
1008 		return;
1009 
1010 	BPF_MTAP(ifp, m0);
1011 
1012 	/* Queue up packet on the proper port. */
1013 	error = ng_fec_choose_port(b, m0, &oifp);
1014 	if (error) {
1015 		IFNET_STAT_INC(ifp, ierrors, 1);
1016 		m_freem(m0);
1017 		priv->if_error = ENOBUFS;
1018 		return;
1019 	}
1020 	IFNET_STAT_INC(ifp, opackets, 1);
1021 
1022 	/*
1023 	 * Release current iface's serializer to avoid possible dead lock
1024 	 */
1025 	priv->if_error = ether_output_frame(oifp, m0);
1026 }
1027 
1028 #ifdef DEBUG
1029 /*
1030  * Display an ioctl to the virtual interface
1031  */
1032 
1033 static void
1034 ng_fec_print_ioctl(struct ifnet *ifp, int command, caddr_t data)
1035 {
1036 	char   *str;
1037 
1038 	switch (command & IOC_DIRMASK) {
1039 	case IOC_VOID:
1040 		str = "IO";
1041 		break;
1042 	case IOC_OUT:
1043 		str = "IOR";
1044 		break;
1045 	case IOC_IN:
1046 		str = "IOW";
1047 		break;
1048 	case IOC_INOUT:
1049 		str = "IORW";
1050 		break;
1051 	default:
1052 		str = "IO??";
1053 	}
1054 	log(LOG_DEBUG, "%s: %s('%c', %d, char[%d])\n",
1055 	       ifp->if_xname,
1056 	       str,
1057 	       IOCGROUP(command),
1058 	       command & 0xff,
1059 	       IOCPARM_LEN(command));
1060 }
1061 #endif /* DEBUG */
1062 
1063 /************************************************************************
1064 			NETGRAPH NODE STUFF
1065  ************************************************************************/
1066 
1067 /*
1068  * Constructor for a node
1069  */
1070 static int
1071 ng_fec_constructor(node_p *nodep)
1072 {
1073 	char ifname[NG_FEC_FEC_NAME_MAX + 1];
1074 	struct ifnet *ifp;
1075 	node_p node;
1076 	priv_p priv;
1077 	struct ng_fec_bundle *b;
1078 	int error = 0;
1079 
1080 	/* Allocate node and interface private structures */
1081 	priv = kmalloc(sizeof(*priv), M_NETGRAPH, M_NOWAIT | M_ZERO);
1082 	if (priv == NULL)
1083 		return (ENOMEM);
1084 
1085 	ifp = &priv->arpcom.ac_if;
1086 	b = &priv->fec_bundle;
1087 
1088 	/* Link them together */
1089 	ifp->if_softc = priv;
1090 
1091 	/* Get an interface unit number */
1092 	if ((error = ng_fec_get_unit(&priv->unit)) != 0) {
1093 		kfree(ifp, M_NETGRAPH);
1094 		kfree(priv, M_NETGRAPH);
1095 		return (error);
1096 	}
1097 
1098 	/* Call generic node constructor */
1099 	if ((error = ng_make_node_common(&typestruct, nodep)) != 0) {
1100 		ng_fec_free_unit(priv->unit);
1101 		kfree(ifp, M_NETGRAPH);
1102 		kfree(priv, M_NETGRAPH);
1103 		return (error);
1104 	}
1105 	node = *nodep;
1106 
1107 	/* Link together node and private info */
1108 	node->private = priv;
1109 	priv->node = node;
1110 	priv->arpcom.ac_netgraph = node;
1111 
1112 	/* Initialize interface structure */
1113 	if_initname(ifp, NG_FEC_FEC_NAME, priv->unit);
1114 	ifp->if_start = ng_fec_start;
1115 	ifp->if_ioctl = ng_fec_ioctl;
1116 	ifp->if_init = ng_fec_init;
1117 	ifp->if_watchdog = NULL;
1118 	ifq_set_maxlen(&ifp->if_snd, IFQ_MAXLEN);
1119 	ifp->if_mtu = NG_FEC_MTU_DEFAULT;
1120 	ifp->if_flags = (IFF_SIMPLEX|IFF_BROADCAST|IFF_MULTICAST);
1121 	ifp->if_type = IFT_PROPVIRTUAL;		/* XXX */
1122 	ifp->if_addrlen = 0;			/* XXX */
1123 	ifp->if_hdrlen = 0;			/* XXX */
1124 	ifp->if_baudrate = 100000000;		/* XXX */
1125 
1126 	/* Give this node the same name as the interface (if possible) */
1127 	bzero(ifname, sizeof(ifname));
1128 	strlcpy(ifname, ifp->if_xname, sizeof(ifname));
1129 	if (ng_name_node(node, ifname) != 0)
1130 		log(LOG_WARNING, "%s: can't acquire netgraph name\n", ifname);
1131 
1132 	/* Grab hold of the ether_input pipe. */
1133 	if (ng_ether_input_p == NULL)
1134 		ng_ether_input_p = ng_fec_input;
1135 
1136 	/* Attach the interface */
1137 	ether_ifattach(ifp, priv->arpcom.ac_enaddr, NULL);
1138 	priv->real_if_output = ifp->if_output;
1139 	ifp->if_output = ng_fec_output;
1140 	callout_init(&priv->fec_timeout);
1141 
1142 	TAILQ_INIT(&b->ng_fec_ports);
1143 	b->fec_ifcnt = 0;
1144 
1145 	ifmedia_init(&priv->ifmedia, 0,
1146 	    ng_fec_ifmedia_upd, ng_fec_ifmedia_sts);
1147 	ifmedia_add(&priv->ifmedia, IFM_ETHER|IFM_NONE, 0, NULL);
1148 	ifmedia_set(&priv->ifmedia, IFM_ETHER|IFM_NONE);
1149 
1150 	/* Done */
1151 	return (0);
1152 }
1153 
1154 /*
1155  * Receive a control message
1156  */
1157 static int
1158 ng_fec_rcvmsg(node_p node, struct ng_mesg *msg,
1159 		const char *retaddr, struct ng_mesg **rptr)
1160 {
1161 	const priv_p priv = node->private;
1162 	struct ng_fec_bundle	*b;
1163 	struct ng_mesg *resp = NULL;
1164 	char *ifname;
1165 	int error = 0;
1166 
1167 	b = &priv->fec_bundle;
1168 
1169 	switch (msg->header.typecookie) {
1170 	case NGM_FEC_COOKIE:
1171 		switch (msg->header.cmd) {
1172 		case NGM_FEC_ADD_IFACE:
1173 			ifname = msg->data;
1174 			error = ng_fec_addport(priv, ifname);
1175 			break;
1176 		case NGM_FEC_DEL_IFACE:
1177 			ifname = msg->data;
1178 			error = ng_fec_delport(priv, ifname);
1179 			break;
1180 		case NGM_FEC_SET_MODE_MAC:
1181 			b->fec_btype = FEC_BTYPE_MAC;
1182 			break;
1183 #ifdef INET
1184 		case NGM_FEC_SET_MODE_INET:
1185 			b->fec_btype = FEC_BTYPE_INET;
1186 			break;
1187 #ifdef INET6
1188 		case NGM_FEC_SET_MODE_INET6:
1189 			b->fec_btype = FEC_BTYPE_INET6;
1190 			break;
1191 #endif
1192 #endif
1193 		default:
1194 			error = EINVAL;
1195 			break;
1196 		}
1197 		break;
1198 	default:
1199 		error = EINVAL;
1200 		break;
1201 	}
1202 	if (rptr)
1203 		*rptr = resp;
1204 	else if (resp)
1205 		kfree(resp, M_NETGRAPH);
1206 	kfree(msg, M_NETGRAPH);
1207 	return (error);
1208 }
1209 
1210 /*
1211  * Shutdown and remove the node and its associated interface.
1212  */
1213 static int
1214 ng_fec_rmnode(node_p node)
1215 {
1216 	const priv_p priv = node->private;
1217 	struct ng_fec_bundle *b;
1218 	struct ng_fec_portlist	*p;
1219 	char ifname[IFNAMSIZ];
1220 
1221 	b = &priv->fec_bundle;
1222 	ng_fec_stop(&priv->arpcom.ac_if);
1223 
1224 	while (!TAILQ_EMPTY(&b->ng_fec_ports)) {
1225 		p = TAILQ_FIRST(&b->ng_fec_ports);
1226 		ksprintf(ifname, "%s",
1227 		    p->fec_if->if_xname); /* XXX: strings */
1228 		ng_fec_delport(priv, ifname);
1229 	}
1230 
1231 	ng_cutlinks(node);
1232 	ng_unname(node);
1233 	if (ng_ether_input_p != NULL)
1234 		ng_ether_input_p = NULL;
1235 	ether_ifdetach(&priv->arpcom.ac_if);
1236 	ifmedia_removeall(&priv->ifmedia);
1237 	ng_fec_free_unit(priv->unit);
1238 	kfree(priv, M_NETGRAPH);
1239 	node->private = NULL;
1240 	ng_unref(node);
1241 	return (0);
1242 }
1243