xref: /dragonfly/sys/netgraph/fec/ng_fec.c (revision 984263bc)
1 /*
2  * ng_fec.c
3  *
4  * Copyright (c) 2001 Berkeley Software Design, Inc.
5  * Copyright (c) 2000, 2001
6  *	Bill Paul <wpaul@osd.bsdi.com>.  All rights reserved.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  * 3. All advertising materials mentioning features or use of this software
17  *    must display the following acknowledgement:
18  *	This product includes software developed by Bill Paul.
19  * 4. Neither the name of the author nor the names of any co-contributors
20  *    may be used to endorse or promote products derived from this software
21  *    without specific prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY Bill Paul AND CONTRIBUTORS ``AS IS'' AND
24  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26  * ARE DISCLAIMED.  IN NO EVENT SHALL Bill Paul OR THE VOICES IN HIS HEAD
27  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
28  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
29  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
30  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
31  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
32  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
33  * THE POSSIBILITY OF SUCH DAMAGE.
34  *
35  * $FreeBSD: src/sys/netgraph/ng_fec.c,v 1.1.2.1 2002/11/01 21:39:31 julian Exp $
36  */
37 /*
38  * Copyright (c) 1996-1999 Whistle Communications, Inc.
39  * All rights reserved.
40  *
41  * Subject to the following obligations and disclaimer of warranty, use and
42  * redistribution of this software, in source or object code forms, with or
43  * without modifications are expressly permitted by Whistle Communications;
44  * provided, however, that:
45  * 1. Any and all reproductions of the source or object code must include the
46  *    copyright notice above and the following disclaimer of warranties; and
47  * 2. No rights are granted, in any manner or form, to use Whistle
48  *    Communications, Inc. trademarks, including the mark "WHISTLE
49  *    COMMUNICATIONS" on advertising, endorsements, or otherwise except as
50  *    such appears in the above copyright notice or in the software.
51  *
52  * THIS SOFTWARE IS BEING PROVIDED BY WHISTLE COMMUNICATIONS "AS IS", AND
53  * TO THE MAXIMUM EXTENT PERMITTED BY LAW, WHISTLE COMMUNICATIONS MAKES NO
54  * REPRESENTATIONS OR WARRANTIES, EXPRESS OR IMPLIED, REGARDING THIS SOFTWARE,
55  * INCLUDING WITHOUT LIMITATION, ANY AND ALL IMPLIED WARRANTIES OF
56  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE, OR NON-INFRINGEMENT.
57  * WHISTLE COMMUNICATIONS DOES NOT WARRANT, GUARANTEE, OR MAKE ANY
58  * REPRESENTATIONS REGARDING THE USE OF, OR THE RESULTS OF THE USE OF THIS
59  * SOFTWARE IN TERMS OF ITS CORRECTNESS, ACCURACY, RELIABILITY OR OTHERWISE.
60  * IN NO EVENT SHALL WHISTLE COMMUNICATIONS BE LIABLE FOR ANY DAMAGES
61  * RESULTING FROM OR ARISING OUT OF ANY USE OF THIS SOFTWARE, INCLUDING
62  * WITHOUT LIMITATION, ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY,
63  * PUNITIVE, OR CONSEQUENTIAL DAMAGES, PROCUREMENT OF SUBSTITUTE GOODS OR
64  * SERVICES, LOSS OF USE, DATA OR PROFITS, HOWEVER CAUSED AND UNDER ANY
65  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
66  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
67  * THIS SOFTWARE, EVEN IF WHISTLE COMMUNICATIONS IS ADVISED OF THE POSSIBILITY
68  * OF SUCH DAMAGE.
69  *
70  * Author: Archie Cobbs <archie@freebsd.org>
71  *
72  * $Whistle: ng_fec.c,v 1.33 1999/11/01 09:24:51 julian Exp $
73  */
74 
75 /*
76  * This module implements ethernet channel bonding using the Cisco
77  * Fast EtherChannel mechanism. Two or four ports may be combined
78  * into a single aggregate interface.
79  *
80  * Interfaces are named fec0, fec1, etc.  New nodes take the
81  * first available interface name.
82  *
83  * This node also includes Berkeley packet filter support.
84  *
85  * Note that this node doesn't need to connect to any other
86  * netgraph nodes in order to do its work.
87  */
88 
89 #include <sys/param.h>
90 #include <sys/systm.h>
91 #include <sys/errno.h>
92 #include <sys/kernel.h>
93 #include <sys/malloc.h>
94 #include <sys/mbuf.h>
95 #include <sys/errno.h>
96 #include <sys/sockio.h>
97 #include <sys/socket.h>
98 #include <sys/syslog.h>
99 #include <sys/libkern.h>
100 #include <sys/queue.h>
101 
102 #include <net/if.h>
103 #include <net/if_types.h>
104 #include <net/if_arp.h>
105 #include <net/if_dl.h>
106 #include <net/if_media.h>
107 #include <net/intrq.h>
108 #include <net/bpf.h>
109 #include <net/ethernet.h>
110 
111 #include "opt_inet.h"
112 #include "opt_inet6.h"
113 
114 #include <netinet/in.h>
115 #ifdef INET
116 #include <netinet/in_systm.h>
117 #include <netinet/ip.h>
118 #endif
119 
120 #ifdef INET6
121 #include <netinet/ip6.h>
122 #endif
123 
124 #include <netgraph/ng_message.h>
125 #include <netgraph/netgraph.h>
126 #include <netgraph/ng_parse.h>
127 #include <netgraph/ng_fec.h>
128 
/* Fetch the netgraph node pointer stored in an Ethernet interface's arpcom. */
#define IFP2NG(ifp)  ((struct ng_node *)((struct arpcom *)(ifp))->ac_netgraph)
/*
 * Advance x by one, wrapping at y.  Arguments and the whole expansion
 * are parenthesized so that expression arguments (e.g. "n + 1") bind
 * as the caller intends.  Note that x is evaluated twice.
 */
#define FEC_INC(x, y)	((x) = ((x) + 1) % (y))
131 
/*
 * Current fast etherchannel implementations use either 2 or 4
 * ports, so for now we limit the maximum bundle size to 4 interfaces.
 */
#define FEC_BUNDLESIZ	4

/*
 * One member port of a bundle.  Entries are allocated in
 * ng_fec_addport() and linked on the owning bundle's ng_fec_ports list.
 */
struct ng_fec_portlist {
	/* Underlying interface that carries the traffic. */
	struct ifnet		*fec_if;
	/* Slot number compared against the transmit hash result. */
	int			fec_idx;
	/* Link state as tracked by ng_fec_tick(): -1 unknown, 0 down, 1 up. */
	int			fec_ifstat;
	/* The port's own MAC address, saved so ng_fec_delport() can restore it. */
	struct ether_addr	fec_mac;
	/* Linkage on the bundle's port list. */
	TAILQ_ENTRY(ng_fec_portlist) fec_list;
};
145 
/* The set of ports aggregated behind one fec interface. */
struct ng_fec_bundle {
	/* Member ports, in the order they were added. */
	TAILQ_HEAD(,ng_fec_portlist) ng_fec_ports;
	/* Number of entries on ng_fec_ports. */
	int			fec_ifcnt;
	/* One of the FEC_BTYPE_* values below. */
	int			fec_btype;
};

/* Values for fec_btype: which addresses feed the port-selection hash. */
#define FEC_BTYPE_MAC		0x01
#define FEC_BTYPE_INET		0x02
#define FEC_BTYPE_INET6		0x03
155 
/*
 * Node private data.  One instance is allocated per fec node by
 * ng_fec_constructor(); it embeds the virtual interface itself, and
 * the interface's if_softc points back at this structure.
 */
struct ng_fec_private {
	struct arpcom arpcom;		/* Virtual interface (ifnet + Ethernet state) */
	struct ifmedia ifmedia;		/* Media state served via ifmedia_ioctl() */
	int	if_flags;		/* Saved flags, used to spot IFF_PROMISC changes */
	int	if_error;		/* XXX error handed from ng_fec_start() to ng_fec_output() */
	int	unit;			/* Interface unit number */
	node_p	node;			/* Our netgraph node */
	struct ng_fec_bundle fec_bundle;/* Aggregate bundle */
	struct callout_handle fec_ch;	/* callout handle for ticker */
};
typedef struct ng_fec_private *priv_p;
168 
/*
 * Interface methods: forward declarations for the routines installed
 * in the virtual interface's ifnet and the helpers they use.
 */
static void	ng_fec_input(struct ifnet *, struct mbuf **,
			struct ether_header *);
static void	ng_fec_start(struct ifnet *ifp);
static int	ng_fec_choose_port(struct ng_fec_bundle *b,
			struct mbuf *m, struct ifnet **ifp);
static int	ng_fec_setport(struct ifnet *ifp, u_long cmd, caddr_t data);
static void	ng_fec_init(void *arg);
static void	ng_fec_stop(struct ifnet *ifp);
static int	ng_fec_ifmedia_upd(struct ifnet *ifp);
static void	ng_fec_ifmedia_sts(struct ifnet *ifp, struct ifmediareq *ifmr);
static int	ng_fec_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data);
static int	ng_fec_output(struct ifnet *ifp, struct mbuf *m0,
			struct sockaddr *dst, struct rtentry *rt0);
static void	ng_fec_tick(void *arg);
static int	ng_fec_addport(struct ng_fec_private *priv, char *iface);
static int	ng_fec_delport(struct ng_fec_private *priv, char *iface);

/* Only built when DEBUG is defined; logs each ioctl seen by ng_fec_ioctl(). */
#ifdef DEBUG
static void	ng_fec_print_ioctl(struct ifnet *ifp, int cmd, caddr_t data);
#endif

/* Netgraph methods (the ones this node type supplies in typestruct) */
static ng_constructor_t	ng_fec_constructor;
static ng_rcvmsg_t	ng_fec_rcvmsg;
static ng_shutdown_t	ng_fec_rmnode;
195 
/*
 * List of commands and how to convert arguments to/from ASCII.
 *
 * add_iface and del_iface carry an interface name and therefore use
 * the string parse type; the set_mode_* commands carry no argument.
 * The list is terminated by an all-zero entry.
 *
 * NOTE(review): ng_fec_rcvmsg() also handles NGM_FEC_SET_MODE_INET6
 * (when INET and INET6 are defined) but there is no entry for it
 * here -- confirm whether that omission is intentional.
 */
static const struct ng_cmdlist ng_fec_cmds[] = {
	{
	  NGM_FEC_COOKIE,
	  NGM_FEC_ADD_IFACE,
	  "add_iface",
	  &ng_parse_string_type,
	  NULL,
	},
	{
	  NGM_FEC_COOKIE,
	  NGM_FEC_DEL_IFACE,
	  "del_iface",
	  &ng_parse_string_type,
	  NULL,
	},
	{
	  NGM_FEC_COOKIE,
	  NGM_FEC_SET_MODE_MAC,
	  "set_mode_mac",
	  NULL,
	  NULL,
	},
	{
	  NGM_FEC_COOKIE,
	  NGM_FEC_SET_MODE_INET,
	  "set_mode_inet",
	  NULL,
	  NULL,
	},
	{ 0 }
};
228 
/*
 * Node type descriptor.
 *
 * Only a constructor, a message handler and a shutdown routine are
 * supplied; every other method slot is left NULL.
 * NOTE(review): this is a positional initializer, so the meaning of
 * each slot comes from struct ng_type in netgraph.h -- check that
 * header before reordering or inserting entries.
 */
static struct ng_type typestruct = {
	NG_VERSION,
	NG_FEC_NODE_TYPE,
	NULL,
	ng_fec_constructor,
	ng_fec_rcvmsg,
	ng_fec_rmnode,
	NULL,
	NULL,
	NULL,
	NULL,
	NULL,
	NULL,
	ng_fec_cmds
};
/* Register the "fec" node type with netgraph. */
NETGRAPH_INIT(fec, &typestruct);
246 
/*
 * We keep a bitmap indicating which unit numbers are free.
 * One means the unit number is free, zero means it's taken.
 * The bitmap is an array of ints that ng_fec_get_unit() grows on
 * demand; ng_fec_units_len is its length in words and
 * ng_units_in_use counts the units currently handed out.
 */
static int	*ng_fec_units = NULL;
static int	ng_fec_units_len = 0;
static int	ng_units_in_use = 0;

/* Number of unit bits held by one word of the bitmap. */
#define UNITS_BITSPERWORD	(sizeof(*ng_fec_units) * NBBY)
254 
255 /*
256  * Find the first free unit number for a new interface.
257  * Increase the size of the unit bitmap as necessary.
258  */
259 static __inline__ int
260 ng_fec_get_unit(int *unit)
261 {
262 	int index, bit;
263 
264 	for (index = 0; index < ng_fec_units_len
265 	    && ng_fec_units[index] == 0; index++);
266 	if (index == ng_fec_units_len) {		/* extend array */
267 		int i, *newarray, newlen;
268 
269 		newlen = (2 * ng_fec_units_len) + 4;
270 		MALLOC(newarray, int *, newlen * sizeof(*ng_fec_units),
271 		    M_NETGRAPH, M_NOWAIT);
272 		if (newarray == NULL)
273 			return (ENOMEM);
274 		bcopy(ng_fec_units, newarray,
275 		    ng_fec_units_len * sizeof(*ng_fec_units));
276 		for (i = ng_fec_units_len; i < newlen; i++)
277 			newarray[i] = ~0;
278 		if (ng_fec_units != NULL)
279 			FREE(ng_fec_units, M_NETGRAPH);
280 		ng_fec_units = newarray;
281 		ng_fec_units_len = newlen;
282 	}
283 	bit = ffs(ng_fec_units[index]) - 1;
284 	KASSERT(bit >= 0 && bit <= UNITS_BITSPERWORD - 1,
285 	    ("%s: word=%d bit=%d", __FUNCTION__, ng_fec_units[index], bit));
286 	ng_fec_units[index] &= ~(1 << bit);
287 	*unit = (index * UNITS_BITSPERWORD) + bit;
288 	ng_units_in_use++;
289 	return (0);
290 }
291 
292 /*
293  * Free a no longer needed unit number.
294  */
295 static __inline__ void
296 ng_fec_free_unit(int unit)
297 {
298 	int index, bit;
299 
300 	index = unit / UNITS_BITSPERWORD;
301 	bit = unit % UNITS_BITSPERWORD;
302 	KASSERT(index < ng_fec_units_len,
303 	    ("%s: unit=%d len=%d", __FUNCTION__, unit, ng_fec_units_len));
304 	KASSERT((ng_fec_units[index] & (1 << bit)) == 0,
305 	    ("%s: unit=%d is free", __FUNCTION__, unit));
306 	ng_fec_units[index] |= (1 << bit);
307 	/*
308 	 * XXX We could think about reducing the size of ng_fec_units[]
309 	 * XXX here if the last portion is all ones
310 	 * XXX At least free it if no more units.
311 	 * Needed if we are eventually be able to unload.
312 	 */
313 	ng_units_in_use++;
314 	if (ng_units_in_use == 0) { /* XXX make SMP safe */
315 		FREE(ng_fec_units, M_NETGRAPH);
316 		ng_fec_units_len = 0;
317 		ng_fec_units = NULL;
318 	}
319 }
320 
321 /************************************************************************
322 			INTERFACE STUFF
323  ************************************************************************/
324 
325 static int
326 ng_fec_addport(struct ng_fec_private *priv, char *iface)
327 {
328 	struct ng_fec_bundle	*b;
329 	struct ifnet		*ifp, *bifp;
330 	struct arpcom		*ac;
331 	struct ifaddr		*ifa;
332 	struct sockaddr_dl	*sdl;
333 	struct ng_fec_portlist	*p, *new;
334 
335 	if (priv == NULL || iface == NULL)
336 		return(EINVAL);
337 
338 	b = &priv->fec_bundle;
339 	ifp = &priv->arpcom.ac_if;
340 
341 	/* Find the interface */
342 	bifp = ifunit(iface);
343 	if (bifp == NULL) {
344 		printf("fec%d: tried to add iface %s, which "
345 		    "doesn't seem to exist\n", priv->unit, iface);
346 		return(ENOENT);
347 	}
348 
349 	/* See if we have room in the bundle */
350 	if (b->fec_ifcnt == FEC_BUNDLESIZ) {
351 		printf("fec%d: can't add new iface; bundle is full\n",
352 		    priv->unit);
353 		return(ENOSPC);
354 	}
355 
356 	/* See if the interface is already in the bundle */
357 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
358 		if (p->fec_if == bifp) {
359 			printf("fec%d: iface %s is already in this "
360 			    "bundle\n", priv->unit, iface);
361 			return(EINVAL);
362 		}
363 	}
364 
365 	/* Allocate new list entry. */
366 	MALLOC(new, struct ng_fec_portlist *,
367 	    sizeof(struct ng_fec_portlist), M_NETGRAPH, M_NOWAIT);
368 	if (new == NULL)
369 		return(ENOMEM);
370 
371 	ac = (struct arpcom *)bifp;
372 	ac->ac_netgraph = priv->node;
373 
374 	/*
375 	 * If this is the first interface added to the bundle,
376 	 * use its MAC address for the virtual interface (and,
377 	 * by extension, all the other ports in the bundle).
378 	 */
379 	if (b->fec_ifcnt == 0) {
380 		ifa = ifnet_addrs[ifp->if_index - 1];
381 		sdl = (struct sockaddr_dl *)ifa->ifa_addr;
382 		bcopy((char *)ac->ac_enaddr,
383 		    priv->arpcom.ac_enaddr, ETHER_ADDR_LEN);
384 		bcopy((char *)ac->ac_enaddr,
385 		    LLADDR(sdl), ETHER_ADDR_LEN);
386 	}
387 
388 	b->fec_btype = FEC_BTYPE_MAC;
389 	new->fec_idx = b->fec_ifcnt;
390 	b->fec_ifcnt++;
391 
392 	/* Save the real MAC address. */
393 	bcopy((char *)ac->ac_enaddr,
394 	    (char *)&new->fec_mac, ETHER_ADDR_LEN);
395 
396 	/* Set up phony MAC address. */
397 	ifa = ifnet_addrs[bifp->if_index - 1];
398 	sdl = (struct sockaddr_dl *)ifa->ifa_addr;
399 	bcopy(priv->arpcom.ac_enaddr, ac->ac_enaddr, ETHER_ADDR_LEN);
400 	bcopy(priv->arpcom.ac_enaddr, LLADDR(sdl), ETHER_ADDR_LEN);
401 
402 	/* Add to the queue */
403 	new->fec_if = bifp;
404 	TAILQ_INSERT_TAIL(&b->ng_fec_ports, new, fec_list);
405 
406 	return(0);
407 }
408 
409 static int
410 ng_fec_delport(struct ng_fec_private *priv, char *iface)
411 {
412 	struct ng_fec_bundle	*b;
413 	struct ifnet		*ifp, *bifp;
414 	struct arpcom		*ac;
415 	struct ifaddr		*ifa;
416 	struct sockaddr_dl	*sdl;
417 	struct ng_fec_portlist	*p;
418 
419 	if (priv == NULL || iface == NULL)
420 		return(EINVAL);
421 
422 	b = &priv->fec_bundle;
423 	ifp = &priv->arpcom.ac_if;
424 
425 	/* Find the interface */
426 	bifp = ifunit(iface);
427 	if (bifp == NULL) {
428 		printf("fec%d: tried to remove iface %s, which "
429 		    "doesn't seem to exist\n", priv->unit, iface);
430 		return(ENOENT);
431 	}
432 
433 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
434 		if (p->fec_if == bifp)
435 			break;
436 	}
437 
438 	if (p == NULL) {
439 		printf("fec%d: tried to remove iface %s which "
440 		    "is not in our bundle\n", priv->unit, iface);
441 		return(EINVAL);
442 	}
443 
444 	/* Stop interface */
445 	bifp->if_flags &= ~IFF_UP;
446 	(*bifp->if_ioctl)(bifp, SIOCSIFFLAGS, NULL);
447 
448 	/* Restore MAC address. */
449 	ac = (struct arpcom *)bifp;
450 	ifa = ifnet_addrs[bifp->if_index - 1];
451 	sdl = (struct sockaddr_dl *)ifa->ifa_addr;
452 	bcopy((char *)&p->fec_mac, ac->ac_enaddr, ETHER_ADDR_LEN);
453 	bcopy((char *)&p->fec_mac, LLADDR(sdl), ETHER_ADDR_LEN);
454 
455 	/* Delete port */
456 	TAILQ_REMOVE(&b->ng_fec_ports, p, fec_list);
457 	FREE(p, M_NETGRAPH);
458 	b->fec_ifcnt--;
459 
460 	return(0);
461 }
462 
463 /*
464  * Pass an ioctl command down to all the underyling interfaces in a
465  * bundle. Used for setting multicast filters and flags.
466  */
467 
468 static int
469 ng_fec_setport(struct ifnet *ifp, u_long command, caddr_t data)
470 {
471 	struct ng_fec_private	*priv;
472 	struct ng_fec_bundle	*b;
473 	struct ifnet		*oifp;
474 	struct ng_fec_portlist	*p;
475 
476 	priv = ifp->if_softc;
477 	b = &priv->fec_bundle;
478 
479 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
480 		oifp = p->fec_if;
481 		if (oifp != NULL)
482 			(*oifp->if_ioctl)(oifp, command, data);
483 	}
484 
485 	return(0);
486 }
487 
488 static void
489 ng_fec_init(void *arg)
490 {
491 	struct ng_fec_private	*priv;
492 	struct ng_fec_bundle	*b;
493 	struct ifnet		*ifp, *bifp;
494 	struct ng_fec_portlist	*p;
495 
496 	ifp = arg;
497 	priv = ifp->if_softc;
498 	b = &priv->fec_bundle;
499 
500 	if (b->fec_ifcnt == 1 || b->fec_ifcnt == 3) {
501 		printf("fec%d: invalid bundle "
502 		    "size: %d\n", priv->unit,
503 		    b->fec_ifcnt);
504 		return;
505 	}
506 
507 	ng_fec_stop(ifp);
508 
509 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
510 		bifp = p->fec_if;
511 		bifp->if_flags |= IFF_UP;
512                 (*bifp->if_ioctl)(bifp, SIOCSIFFLAGS, NULL);
513 		/* mark iface as up and let the monitor check it */
514 		p->fec_ifstat = -1;
515 	}
516 
517 	priv->fec_ch = timeout(ng_fec_tick, priv, hz);
518 
519 	return;
520 }
521 
522 static void
523 ng_fec_stop(struct ifnet *ifp)
524 {
525 	struct ng_fec_private	*priv;
526 	struct ng_fec_bundle	*b;
527 	struct ifnet		*bifp;
528 	struct ng_fec_portlist	*p;
529 
530 	priv = ifp->if_softc;
531 	b = &priv->fec_bundle;
532 
533 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
534 		bifp = p->fec_if;
535 		bifp->if_flags &= ~IFF_UP;
536                 (*bifp->if_ioctl)(bifp, SIOCSIFFLAGS, NULL);
537 	}
538 
539 	untimeout(ng_fec_tick, priv, priv->fec_ch);
540 
541 	return;
542 }
543 
544 static void
545 ng_fec_tick(void *arg)
546 {
547 	struct ng_fec_private	*priv;
548 	struct ng_fec_bundle	*b;
549         struct ifmediareq	ifmr;
550 	struct ifnet		*ifp;
551 	struct ng_fec_portlist	*p;
552 	int			error = 0;
553 
554 	priv = arg;
555 	b = &priv->fec_bundle;
556 
557 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
558 		bzero((char *)&ifmr, sizeof(ifmr));
559 		ifp = p->fec_if;
560 		error = (*ifp->if_ioctl)(ifp, SIOCGIFMEDIA, (caddr_t)&ifmr);
561 		if (error) {
562 			printf("fec%d: failed to check status "
563 			    "of link %s%d\n", priv->unit, ifp->if_name,
564 			    ifp->if_unit);
565 			continue;
566 		}
567 
568         	if (ifmr.ifm_status & IFM_AVALID &&
569                     IFM_TYPE(ifmr.ifm_active) == IFM_ETHER) {
570 			if (ifmr.ifm_status & IFM_ACTIVE) {
571 				if (p->fec_ifstat == -1 ||
572 				    p->fec_ifstat == 0) {
573 					p->fec_ifstat = 1;
574 					printf("fec%d: port %s%d in bundle "
575 					    "is up\n", priv->unit,
576 					    ifp->if_name, ifp->if_unit);
577 				}
578 			} else {
579 				if (p->fec_ifstat == -1 ||
580 				    p->fec_ifstat == 1) {
581 					p->fec_ifstat = 0;
582 					printf("fec%d: port %s%d in bundle "
583 					    "is down\n", priv->unit,
584 					    ifp->if_name, ifp->if_unit);
585 				}
586 			}
587 		}
588 	}
589 
590 	ifp = &priv->arpcom.ac_if;
591 	if (ifp->if_flags & IFF_RUNNING)
592 		priv->fec_ch = timeout(ng_fec_tick, priv, hz);
593 
594 	return;
595 }
596 
/*
 * Media-change callback registered with ifmedia_init().  It does
 * nothing and always reports success.
 */
static int
ng_fec_ifmedia_upd(struct ifnet *ifp)
{
	return (0);
}
602 
603 static void ng_fec_ifmedia_sts(struct ifnet *ifp,
604 	struct ifmediareq *ifmr)
605 {
606 	struct ng_fec_private	*priv;
607 	struct ng_fec_bundle	*b;
608 	struct ng_fec_portlist	*p;
609 
610 	priv = ifp->if_softc;
611 	b = &priv->fec_bundle;
612 
613 	ifmr->ifm_status = IFM_AVALID;
614 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
615 		if (p->fec_ifstat) {
616 			ifmr->ifm_status |= IFM_ACTIVE;
617 			break;
618 		}
619 	}
620 
621 	return;
622 }
623 
/*
 * Process an ioctl for the virtual interface.
 *
 * The whole switch runs between splimp() and splx().  Returns 0 on
 * success, the error from ether_ioctl()/ifmedia_ioctl() for the
 * commands passed on to them, EOPNOTSUPP for SIOCSIFPHYS and EINVAL
 * for an unknown command or an attempt to bring up a bundle holding
 * one or three ports.
 */
static int
ng_fec_ioctl(struct ifnet *ifp, u_long command, caddr_t data)
{
	struct ifreq *const ifr = (struct ifreq *) data;
	int s, error = 0;
	struct ng_fec_private	*priv;
	struct ng_fec_bundle	*b;

	priv = ifp->if_softc;
	b = &priv->fec_bundle;

#ifdef DEBUG
	ng_fec_print_ioctl(ifp, command, data);
#endif
	s = splimp();
	switch (command) {

	/* Address and MTU requests are handed to the generic Ethernet code */
	case SIOCSIFADDR:
	case SIOCGIFADDR:
	case SIOCSIFMTU:
		error = ether_ioctl(ifp, command, data);
		break;

	/* Set flags */
	case SIOCSIFFLAGS:
		/*
		 * If the interface is marked up and stopped, then start it.
		 * If it is marked down and running, then stop it.
		 */
		if (ifr->ifr_flags & IFF_UP) {
			if (!(ifp->if_flags & IFF_RUNNING)) {
				/* Sanity. */
				if (b->fec_ifcnt == 1 || b->fec_ifcnt == 3) {
					printf("fec%d: invalid bundle "
					    "size: %d\n", priv->unit,
					    b->fec_ifcnt);
					error = EINVAL;
					/* leaves the switch; splx() below still runs */
					break;
				}
				ifp->if_flags &= ~(IFF_OACTIVE);
				ifp->if_flags |= IFF_RUNNING;
				ng_fec_init(ifp);
			}
			/*
			 * Bubble down changes in promisc mode to
			 * underlying interfaces.
			 */
			if ((ifp->if_flags & IFF_PROMISC) !=
			    (priv->if_flags & IFF_PROMISC)) {
				ng_fec_setport(ifp, command, data);
				/* remember the flags for the next comparison */
				priv->if_flags = ifp->if_flags;
			}
		} else {
			if (ifp->if_flags & IFF_RUNNING)
				ifp->if_flags &= ~(IFF_RUNNING | IFF_OACTIVE);
			/* the ports are stopped whether or not we were running */
			ng_fec_stop(ifp);
		}
		break;

	/* Multicast filter changes are replayed on every member port */
	case SIOCADDMULTI:
	case SIOCDELMULTI:
		ng_fec_setport(ifp, command, data);
		error = 0;
		break;
	case SIOCGIFMEDIA:
	case SIOCSIFMEDIA:
		error = ifmedia_ioctl(ifp, ifr, &priv->ifmedia, command);
		break;
	/* Stuff that's not supported */
	case SIOCSIFPHYS:
		error = EOPNOTSUPP;
		break;

	default:
		error = EINVAL;
		break;
	}
	(void) splx(s);
	return (error);
}
708 
709 /*
710  * This routine spies on mbufs passing through ether_input(). If
711  * they come from one of the interfaces that are aggregated into
712  * our bundle, we fix up the ifnet pointer and increment our
713  * packet counters so that it looks like the frames are actually
714  * coming from us.
715  */
716 static void
717 ng_fec_input(struct ifnet *ifp, struct mbuf **m0,
718 		struct ether_header *eh)
719 {
720 	struct ng_node		*node;
721 	struct ng_fec_private	*priv;
722 	struct ng_fec_bundle	*b;
723 	struct mbuf		*m;
724 	struct ifnet		*bifp;
725 	struct ng_fec_portlist	*p;
726 
727 	/* Sanity check */
728 	if (ifp == NULL || m0 == NULL || eh == NULL)
729 		return;
730 
731 	node = IFP2NG(ifp);
732 
733 	/* Sanity check part II */
734 	if (node == NULL)
735 		return;
736 
737 	priv = node->private;
738 	b = &priv->fec_bundle;
739 	bifp = &priv->arpcom.ac_if;
740 
741 	m = *m0;
742 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
743 		if (p->fec_if == m->m_pkthdr.rcvif)
744 			break;
745 	}
746 
747 	/* Wasn't meant for us; leave this frame alone. */
748 	if (p == NULL)
749 		return;
750 
751 	/* Pretend this is our frame. */
752 	m->m_pkthdr.rcvif = bifp;
753 	bifp->if_ipackets++;
754 	bifp->if_ibytes += m->m_pkthdr.len + sizeof(struct ether_header);
755 
756         /* Check for a BPF tap */
757 	if (bifp->if_bpf != NULL) {
758 		struct m_hdr mh;
759 
760 		/* This kludge is OK; BPF treats the "mbuf" as read-only */
761 		mh.mh_next = m;
762 		mh.mh_data = (char *)eh;
763 		mh.mh_len = ETHER_HDR_LEN;
764 		bpf_mtap(bifp, (struct mbuf *)&mh);
765 	}
766 
767 	return;
768 }
769 
770 /*
771  * Take a quick peek at the packet and see if it's ok for us to use
772  * the inet or inet6 hash methods on it, if they're enabled. We do
773  * this by setting flags in the mbuf header. Once we've made up our
774  * mind what to do, we pass the frame to ether_output() for further
775  * processing.
776  */
777 
778 static int
779 ng_fec_output(struct ifnet *ifp, struct mbuf *m,
780 		struct sockaddr *dst, struct rtentry *rt0)
781 {
782 	const priv_p priv = (priv_p) ifp->if_softc;
783 	struct ng_fec_bundle *b;
784 	int error;
785 
786 	/* Check interface flags */
787 	if ((ifp->if_flags & (IFF_UP|IFF_RUNNING)) != (IFF_UP|IFF_RUNNING)) {
788 		m_freem(m);
789 		return (ENETDOWN);
790 	}
791 
792 	b = &priv->fec_bundle;
793 
794 	switch (b->fec_btype) {
795 	case FEC_BTYPE_MAC:
796 		m->m_flags |= M_FEC_MAC;
797 		break;
798 #ifdef INET
799 	case FEC_BTYPE_INET:
800 		/*
801 		 * We can't use the INET address port selection
802 		 * scheme if this isn't an INET packet.
803 		 */
804 		if (dst->sa_family == AF_INET)
805 			m->m_flags |= M_FEC_INET;
806 #ifdef INET6
807 		else if (dst->sa_family == AF_INET6)
808 			m->m_flags |= M_FEC_INET6;
809 #endif
810 		else {
811 #ifdef DEBUG
812 			printf("fec%d: can't do inet aggregation of non "
813 			    "inet packet\n", ifp->if_unit);
814 #endif
815 			m->m_flags |= M_FEC_MAC;
816 		}
817 		break;
818 #endif
819 	default:
820 		printf("fec%d: bogus hash type: %d\n", ifp->if_unit,
821 		    b->fec_btype);
822 		m_freem(m);
823 		return(EINVAL);
824 		break;
825 	}
826 
827 	/*
828 	 * Pass the frame to ether_output() for all the protocol
829 	 * handling. This will put the ethernet header on the packet
830 	 * for us.
831 	 */
832 	priv->if_error = 0;
833 	error = ether_output(ifp, m, dst, rt0);
834 	if (priv->if_error && !error)
835 		error = priv->if_error;
836 
837 	return(error);
838 }
839 
840 /*
841  * Apply a hash to the source and destination addresses in the packet
842  * in order to select an interface. Also check link status and handle
843  * dead links accordingly.
844  */
845 
846 static int
847 ng_fec_choose_port(struct ng_fec_bundle *b,
848 	struct mbuf *m, struct ifnet **ifp)
849 {
850 	struct ether_header	*eh;
851 	struct mbuf		*m0;
852 #ifdef INET
853 	struct ip		*ip;
854 #ifdef INET6
855 	struct ip6_hdr		*ip6;
856 #endif
857 #endif
858 
859 	struct ng_fec_portlist	*p;
860 	int			port = 0, mask;
861 
862 	/*
863 	 * If there are only two ports, mask off all but the
864 	 * last bit for XORing. If there are 4, mask off all
865 	 * but the last 2 bits.
866 	 */
867 	mask = b->fec_ifcnt == 2 ? 0x1 : 0x3;
868 	eh = mtod(m, struct ether_header *);
869 #ifdef INET
870 	ip = (struct ip *)(mtod(m, char *) +
871 	    sizeof(struct ether_header));
872 #ifdef INET6
873 	ip6 = (struct ip6_hdr *)(mtod(m, char *) +
874 	    sizeof(struct ether_header));
875 #endif
876 #endif
877 
878 	/*
879 	 * The fg_fec_output() routine is supposed to leave a
880 	 * flag for us in the mbuf that tells us what hash to
881 	 * use, but sometimes a new mbuf is prepended to the
882 	 * chain, so we have to search every mbuf in the chain
883 	 * to find the flags.
884 	 */
885 	m0 = m;
886 	while (m0) {
887 		if (m0->m_flags & (M_FEC_MAC|M_FEC_INET|M_FEC_INET6))
888 			break;
889 		m0 = m0->m_next;
890 	}
891 	if (m0 == NULL)
892 		return(EINVAL);
893 
894 	switch (m0->m_flags & (M_FEC_MAC|M_FEC_INET|M_FEC_INET6)) {
895 	case M_FEC_MAC:
896 		port = (eh->ether_dhost[5] ^
897 		    eh->ether_shost[5]) & mask;
898 		break;
899 #ifdef INET
900 	case M_FEC_INET:
901 		port = (ntohl(ip->ip_dst.s_addr) ^
902 		    ntohl(ip->ip_src.s_addr)) & mask;
903 		break;
904 #ifdef INET6
905 	case M_FEC_INET6:
906 		port = (ip6->ip6_dst.s6_addr[15] ^
907 		    ip6->ip6_dst.s6_addr[15]) & mask;
908 		break;
909 #endif
910 #endif
911 	default:
912 		return(EINVAL);
913 			break;
914 	}
915 
916 	TAILQ_FOREACH(p, &b->ng_fec_ports, fec_list) {
917 		if (port == p->fec_idx)
918 			break;
919 	}
920 
921 	/*
922 	 * Now that we've chosen a port, make sure it's
923 	 * alive. If it's not alive, cycle through the bundle
924 	 * looking for a port that is alive. If we don't find
925 	 * any, return an error.
926 	 */
927 	if (p->fec_ifstat != 1) {
928 		struct ng_fec_portlist	*n = NULL;
929 
930 		n = TAILQ_NEXT(p, fec_list);
931 		if (n == NULL)
932 			n = TAILQ_FIRST(&b->ng_fec_ports);
933 		while (n != p) {
934 			if (n->fec_ifstat == 1)
935 				break;
936 			n = TAILQ_NEXT(n, fec_list);
937 			if (n == NULL)
938 				n = TAILQ_FIRST(&b->ng_fec_ports);
939 		}
940 		if (n == p)
941 			return(EAGAIN);
942 		p = n;
943 	}
944 
945 	*ifp = p->fec_if;
946 
947 	return(0);
948 }
949 
950 /*
951  * Now that the packet has been run through ether_output(), yank it
952  * off our own send queue and stick it on the queue for the appropriate
953  * underlying physical interface. Note that if the interface's send
954  * queue is full, we save an error status in our private netgraph
955  * space which will eventually be handed up to ng_fec_output(), which
956  * will return it to the rest of the IP stack. We need to do this
957  * in order to duplicate the effect of ether_output() returning ENOBUFS
958  * when it detects that an interface's send queue is full. There's no
959  * other way to signal the error status from here since the if_start()
960  * routine is spec'ed to return void.
961  *
962  * Once the frame is queued, we call ether_output_frame() to initiate
963  * transmission.
964  */
965 static void
966 ng_fec_start(struct ifnet *ifp)
967 {
968 	struct ng_fec_private	*priv;
969 	struct ng_fec_bundle	*b;
970 	struct ifnet		*oifp = NULL;
971 	struct mbuf		*m0;
972 	int			error;
973 
974 	priv = ifp->if_softc;
975 	b = &priv->fec_bundle;
976 
977 	IF_DEQUEUE(&ifp->if_snd, m0);
978 	if (m0 == NULL)
979 		return;
980 
981 	if (ifp->if_bpf)
982 		bpf_mtap(ifp, m0);
983 
984 	/* Queue up packet on the proper port. */
985 	error = ng_fec_choose_port(b, m0, &oifp);
986 	if (error) {
987 		ifp->if_ierrors++;
988 		m_freem(m0);
989 		priv->if_error = ENOBUFS;
990 		return;
991 	}
992 	ifp->if_opackets++;
993 
994 	priv->if_error = ether_output_frame(oifp, m0);
995 	return;
996 }
997 
998 #ifdef DEBUG
999 /*
1000  * Display an ioctl to the virtual interface
1001  */
1002 
1003 static void
1004 ng_fec_print_ioctl(struct ifnet *ifp, int command, caddr_t data)
1005 {
1006 	char   *str;
1007 
1008 	switch (command & IOC_DIRMASK) {
1009 	case IOC_VOID:
1010 		str = "IO";
1011 		break;
1012 	case IOC_OUT:
1013 		str = "IOR";
1014 		break;
1015 	case IOC_IN:
1016 		str = "IOW";
1017 		break;
1018 	case IOC_INOUT:
1019 		str = "IORW";
1020 		break;
1021 	default:
1022 		str = "IO??";
1023 	}
1024 	log(LOG_DEBUG, "%s%d: %s('%c', %d, char[%d])\n",
1025 	       ifp->if_name, ifp->if_unit,
1026 	       str,
1027 	       IOCGROUP(command),
1028 	       command & 0xff,
1029 	       IOCPARM_LEN(command));
1030 }
1031 #endif /* DEBUG */
1032 
1033 /************************************************************************
1034 			NETGRAPH NODE STUFF
1035  ************************************************************************/
1036 
1037 /*
1038  * Constructor for a node
1039  */
1040 static int
1041 ng_fec_constructor(node_p *nodep)
1042 {
1043 	char ifname[NG_FEC_FEC_NAME_MAX + 1];
1044 	struct ifnet *ifp;
1045 	node_p node;
1046 	priv_p priv;
1047 	struct ng_fec_bundle *b;
1048 	int error = 0;
1049 
1050 	/* Allocate node and interface private structures */
1051 	MALLOC(priv, priv_p, sizeof(*priv), M_NETGRAPH, M_NOWAIT);
1052 	if (priv == NULL)
1053 		return (ENOMEM);
1054 	bzero(priv, sizeof(*priv));
1055 
1056 	ifp = &priv->arpcom.ac_if;
1057 	b = &priv->fec_bundle;
1058 
1059 	/* Link them together */
1060 	ifp->if_softc = priv;
1061 
1062 	/* Get an interface unit number */
1063 	if ((error = ng_fec_get_unit(&priv->unit)) != 0) {
1064 		FREE(ifp, M_NETGRAPH);
1065 		FREE(priv, M_NETGRAPH);
1066 		return (error);
1067 	}
1068 
1069 	/* Call generic node constructor */
1070 	if ((error = ng_make_node_common(&typestruct, nodep)) != 0) {
1071 		ng_fec_free_unit(priv->unit);
1072 		FREE(ifp, M_NETGRAPH);
1073 		FREE(priv, M_NETGRAPH);
1074 		return (error);
1075 	}
1076 	node = *nodep;
1077 
1078 	/* Link together node and private info */
1079 	node->private = priv;
1080 	priv->node = node;
1081 	priv->arpcom.ac_netgraph = node;
1082 
1083 	/* Initialize interface structure */
1084 	ifp->if_name = NG_FEC_FEC_NAME;
1085 	ifp->if_unit = priv->unit;
1086 	ifp->if_output = ng_fec_output;
1087 	ifp->if_start = ng_fec_start;
1088 	ifp->if_ioctl = ng_fec_ioctl;
1089 	ifp->if_init = ng_fec_init;
1090 	ifp->if_watchdog = NULL;
1091 	ifp->if_snd.ifq_maxlen = IFQ_MAXLEN;
1092 	ifp->if_mtu = NG_FEC_MTU_DEFAULT;
1093 	ifp->if_flags = (IFF_SIMPLEX|IFF_BROADCAST|IFF_MULTICAST);
1094 	ifp->if_type = IFT_PROPVIRTUAL;		/* XXX */
1095 	ifp->if_addrlen = 0;			/* XXX */
1096 	ifp->if_hdrlen = 0;			/* XXX */
1097 	ifp->if_baudrate = 100000000;		/* XXX */
1098 	TAILQ_INIT(&ifp->if_addrhead);
1099 
1100 	/* Give this node the same name as the interface (if possible) */
1101 	bzero(ifname, sizeof(ifname));
1102 	snprintf(ifname, sizeof(ifname), "%s%d", ifp->if_name, ifp->if_unit);
1103 	if (ng_name_node(node, ifname) != 0)
1104 		log(LOG_WARNING, "%s: can't acquire netgraph name\n", ifname);
1105 
1106 	/* Grab hold of the ether_input pipe. */
1107 	if (ng_ether_input_p == NULL)
1108 		ng_ether_input_p = ng_fec_input;
1109 
1110 	/* Attach the interface */
1111 	ether_ifattach(ifp, ETHER_BPF_SUPPORTED);
1112 	callout_handle_init(&priv->fec_ch);
1113 
1114 	TAILQ_INIT(&b->ng_fec_ports);
1115 	b->fec_ifcnt = 0;
1116 
1117 	ifmedia_init(&priv->ifmedia, 0,
1118 	    ng_fec_ifmedia_upd, ng_fec_ifmedia_sts);
1119 	ifmedia_add(&priv->ifmedia, IFM_ETHER|IFM_NONE, 0, NULL);
1120 	ifmedia_set(&priv->ifmedia, IFM_ETHER|IFM_NONE);
1121 
1122 	/* Done */
1123 	return (0);
1124 }
1125 
1126 /*
1127  * Receive a control message
1128  */
1129 static int
1130 ng_fec_rcvmsg(node_p node, struct ng_mesg *msg,
1131 		const char *retaddr, struct ng_mesg **rptr)
1132 {
1133 	const priv_p priv = node->private;
1134 	struct ng_fec_bundle	*b;
1135 	struct ng_mesg *resp = NULL;
1136 	char *ifname;
1137 	int error = 0;
1138 
1139 	b = &priv->fec_bundle;
1140 
1141 	switch (msg->header.typecookie) {
1142 	case NGM_FEC_COOKIE:
1143 		switch (msg->header.cmd) {
1144 		case NGM_FEC_ADD_IFACE:
1145 			ifname = msg->data;
1146 			error = ng_fec_addport(priv, ifname);
1147 			break;
1148 		case NGM_FEC_DEL_IFACE:
1149 			ifname = msg->data;
1150 			error = ng_fec_delport(priv, ifname);
1151 			break;
1152 		case NGM_FEC_SET_MODE_MAC:
1153 			b->fec_btype = FEC_BTYPE_MAC;
1154 			break;
1155 #ifdef INET
1156 		case NGM_FEC_SET_MODE_INET:
1157 			b->fec_btype = FEC_BTYPE_INET;
1158 			break;
1159 #ifdef INET6
1160 		case NGM_FEC_SET_MODE_INET6:
1161 			b->fec_btype = FEC_BTYPE_INET6;
1162 			break;
1163 #endif
1164 #endif
1165 		default:
1166 			error = EINVAL;
1167 			break;
1168 		}
1169 		break;
1170 	default:
1171 		error = EINVAL;
1172 		break;
1173 	}
1174 	if (rptr)
1175 		*rptr = resp;
1176 	else if (resp)
1177 		FREE(resp, M_NETGRAPH);
1178 	FREE(msg, M_NETGRAPH);
1179 	return (error);
1180 }
1181 
1182 /*
1183  * Shutdown and remove the node and its associated interface.
1184  */
1185 static int
1186 ng_fec_rmnode(node_p node)
1187 {
1188 	const priv_p priv = node->private;
1189 	struct ng_fec_bundle *b;
1190 	struct ng_fec_portlist	*p;
1191 	char ifname[IFNAMSIZ];
1192 
1193 	b = &priv->fec_bundle;
1194 	ng_fec_stop(&priv->arpcom.ac_if);
1195 
1196 	while (!TAILQ_EMPTY(&b->ng_fec_ports)) {
1197 		p = TAILQ_FIRST(&b->ng_fec_ports);
1198 		sprintf(ifname, "%s%d",
1199 		    p->fec_if->if_name,
1200 		    p->fec_if->if_unit);
1201 		ng_fec_delport(priv, ifname);
1202 	}
1203 
1204 	ng_cutlinks(node);
1205 	ng_unname(node);
1206 	if (ng_ether_input_p != NULL)
1207 		ng_ether_input_p = NULL;
1208 	ether_ifdetach(&priv->arpcom.ac_if, ETHER_BPF_SUPPORTED);
1209 	ifmedia_removeall(&priv->ifmedia);
1210 	ng_fec_free_unit(priv->unit);
1211 	FREE(priv, M_NETGRAPH);
1212 	node->private = NULL;
1213 	ng_unref(node);
1214 	return (0);
1215 }
1216