1 /*-
2  * Copyright (c) 1990 The Regents of the University of California.
3  * Copyright (c) 2008 The DragonFly Project.
4  * All rights reserved.
5  *
6  * This code is derived from software contributed to Berkeley by
7  * William Jolitz.
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer in the
16  *    documentation and/or other materials provided with the distribution.
17  * 3. Neither the name of the University nor the names of its contributors
18  *    may be used to endorse or promote products derived from this software
19  *    without specific prior written permission.
20  *
21  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31  * SUCH DAMAGE.
32  *
33  *	from: @(#)autoconf.c	7.1 (Berkeley) 5/9/91
34  * $FreeBSD: src/sys/i386/i386/autoconf.c,v 1.146.2.2 2001/06/07 06:05:58 dd Exp $
35  */
36 
37 /*
38  * Setup the system to run on the current machine.
39  *
40  * Configure() is called at boot time and initializes the vba
41  * device tables and the memory controller monitoring.  Available
42  * devices are determined (from possibilities mentioned in ioconf.c),
43  * and the drivers are initialized.
44  */
45 #include "opt_bootp.h"
46 #include "opt_ffs.h"
47 #include "opt_cd9660.h"
48 #include "opt_nfs.h"
49 #include "opt_nfsroot.h"
50 #include "opt_rootdevname.h"
51 
52 #include "use_isa.h"
53 
54 #include <sys/param.h>
55 #include <sys/systm.h>
56 #include <sys/bootmaj.h>
57 #include <sys/bus.h>
58 #include <sys/buf.h>
59 #include <sys/conf.h>
60 #include <sys/diskslice.h>
61 #include <sys/reboot.h>
62 #include <sys/kernel.h>
63 #include <sys/malloc.h>
64 #include <sys/mount.h>
65 #include <sys/cons.h>
66 #include <sys/thread.h>
67 #include <sys/device.h>
68 #include <sys/machintr.h>
69 
70 #include <vm/vm_kern.h>
71 #include <vm/vm_extern.h>
72 #include <vm/vm_pager.h>
73 
74 #if 0
75 #include <machine/pcb.h>
76 #include <machine/pcb_ext.h>
77 #endif
78 #include <machine/smp.h>
79 #include <machine/globaldata.h>
80 #include <machine/md_var.h>
81 
82 #if NISA > 0
83 #include <bus/isa/isavar.h>
84 
85 device_t isa_bus_device = NULL;
86 #endif
87 
88 static void cpu_startup (void *);
89 static void configure_first (void *);
90 static void configure (void *);
91 static void configure_final (void *);
92 
93 #if defined(FFS) && defined(FFS_ROOT)
94 static void	setroot (void);
95 #endif
96 
97 #if defined(NFS) && defined(NFS_ROOT)
98 #if !defined(BOOTP_NFSROOT)
99 static void	pxe_setup_nfsdiskless(void);
100 #endif
101 #endif
102 
103 SYSINIT(cpu, SI_BOOT2_START_CPU, SI_ORDER_FIRST, cpu_startup, NULL);
104 SYSINIT(configure1, SI_SUB_CONFIGURE, SI_ORDER_FIRST, configure_first, NULL);
105 /* SI_ORDER_SECOND is hookable */
106 SYSINIT(configure2, SI_SUB_CONFIGURE, SI_ORDER_THIRD, configure, NULL);
107 /* SI_ORDER_MIDDLE is hookable */
108 SYSINIT(configure3, SI_SUB_CONFIGURE, SI_ORDER_ANY, configure_final, NULL);
109 
110 cdev_t	rootdev = NULL;
111 cdev_t	dumpdev = NULL;
112 
113 /*
114  * nfsroot.iosize may be set in loader.conf, 32768 is recommended to
115  * be able to max-out a GigE link if the server supports it.  Many servers
116  * do not so the default is 8192.
117  *
118  * nfsroot.rahead defaults to something reasonable, can be overridden.
119  */
120 static int nfsroot_iosize = 8192;
121 TUNABLE_INT("nfsroot.iosize", &nfsroot_iosize);
122 static int nfsroot_rahead = 4;
123 TUNABLE_INT("nfsroot.rahead", &nfsroot_rahead);
124 
125 /*
126  *
127  */
128 static void
129 cpu_startup(void *dummy)
130 {
131 	vm_offset_t buffer_sva;
132 	vm_offset_t buffer_eva;
133 	vm_offset_t pager_sva;
134 	vm_offset_t pager_eva;
135 
136 	kprintf("%s", version);
137 	kprintf("real memory = %ju (%juK bytes)\n",
138 	    (uintmax_t)ptoa(Maxmem), (uintmax_t)(ptoa(Maxmem) / 1024));
139 
140 	if (nbuf == 0) {
141 		int factor = 4 * NBUFCALCSIZE / 1024;
142 		int kbytes = Maxmem * (PAGE_SIZE / 1024);
143 
144 		nbuf = 50;
145 		if (kbytes > 4096)
146 			nbuf += min((kbytes - 4096) / factor, 65536 / factor);
147 		if (kbytes > 65536)
148 			nbuf += (kbytes - 65536) * 2 / (factor * 5);
149 		if (maxbcache && nbuf > maxbcache / NBUFCALCSIZE)
150 			nbuf = maxbcache / NBUFCALCSIZE;
151 	}
152 	if (nbuf > (virtual_end - virtual_start) / (MAXBSIZE * 2)) {
153 		nbuf = (virtual_end - virtual_start) / (MAXBSIZE * 2);
154 		kprintf("Warning: nbufs capped at %ld\n", nbuf);
155 	}
156 
157 	nswbuf_mem = lmax(lmin(nbuf / 32, 32), 4);
158 #ifdef NSWBUF_MIN
159 	if (nswbuf_mem < NSWBUF_MIN)
160 		nswbuf_mem = NSWBUF_MIN;
161 #endif
162 	nswbuf_kva = lmax(lmin(nbuf / 4, 256), 16);
163 #ifdef NSWBUF_MIN
164 	if (nswbuf_kva < NSWBUF_MIN)
165 		nswbuf_kva = NSWBUF_MIN;
166 #endif
167 
168 	/*
169 	 * Allocate memory for the buffer cache
170 	 */
171 	buf = (void *)kmem_alloc(&kernel_map,
172 				 nbuf * sizeof(struct buf),
173 				 VM_SUBSYS_BUF);
174 	swbuf_mem = (void *)kmem_alloc(&kernel_map,
175 				       nswbuf_mem * sizeof(struct buf),
176 				       VM_SUBSYS_BUF);
177 	swbuf_kva = (void *)kmem_alloc(&kernel_map,
178 				       nswbuf_kva * sizeof(struct buf),
179 				       VM_SUBSYS_BUF);
180 
181 #ifdef DIRECTIO
182         ffs_rawread_setup();
183 #endif
184 	kmem_suballoc(&kernel_map, &clean_map, &clean_sva, &clean_eva,
185 		      (nbuf * MAXBSIZE * 2) +
186 		      (nswbuf_mem + nswbuf_kva) *MAXPHYS +
187 		      pager_map_size);
188 	kmem_suballoc(&clean_map, &buffer_map, &buffer_sva, &buffer_eva,
189 		      (nbuf * MAXBSIZE * 2));
190 	buffer_map.system_map = 1;
191 	kmem_suballoc(&clean_map, &pager_map, &pager_sva, &pager_eva,
192 		      (nswbuf_mem + nswbuf_kva) *MAXPHYS +
193 		      pager_map_size);
194 	pager_map.system_map = 1;
195 	kprintf("avail memory = %lu (%luK bytes)\n", ptoa(vmstats.v_free_count),
196 		ptoa(vmstats.v_free_count) / 1024);
197 	mp_start();
198 	mp_announce();
199 	cpu_setregs();
200 }
201 
202 /*
203  * Determine i/o configuration for a machine.
204  */
205 static void
206 configure_first(void *dummy)
207 {
208 }
209 
210 static void
211 configure(void *dummy)
212 {
213         /*
214 	 * Final interrupt support acviation, then enable hardware interrupts.
215 	 */
216 	MachIntrABI.finalize();
217 	cpu_enable_intr();
218 
219 	/*
220 	 * This will configure all devices, generally starting with the
221 	 * nexus (i386/i386/nexus.c).  The nexus ISA code explicitly
222 	 * dummies up the attach in order to delay legacy initialization
223 	 * until after all other busses/subsystems have had a chance
224 	 * at those resources.
225 	 */
226 	root_bus_configure();
227 
228 #if NISA > 0
229 	/*
230 	 * Explicitly probe and attach ISA last.  The isa bus saves
231 	 * it's device node at attach time for us here.
232 	 */
233 	if (isa_bus_device)
234 		isa_probe_children(isa_bus_device);
235 #endif
236 
237 	/*
238 	 * Allow lowering of the ipl to the lowest kernel level if we
239 	 * panic (or call tsleep() before clearing `cold').  No level is
240 	 * completely safe (since a panic may occur in a critical region
241 	 * at splhigh()), but we want at least bio interrupts to work.
242 	 */
243 	safepri = TDPRI_KERN_USER;
244 }
245 
246 static void
247 configure_final(void *dummy)
248 {
249 	cninit_finish();
250 
251 	if (bootverbose)
252 		kprintf("Device configuration finished.\n");
253 }
254 
255 #ifdef BOOTP
256 void bootpc_init(void);
257 #endif
258 /*
259  * Do legacy root filesystem discovery.
260  */
261 void
262 cpu_rootconf(void)
263 {
264 #ifdef BOOTP
265         bootpc_init();
266 #endif
267 #if defined(NFS) && defined(NFS_ROOT)
268 #if !defined(BOOTP_NFSROOT)
269 	pxe_setup_nfsdiskless();
270 	if (nfs_diskless_valid)
271 #endif
272 		rootdevnames[0] = "nfs:";
273 #endif
274 #if defined(FFS) && defined(FFS_ROOT)
275         if (!rootdevnames[0])
276                 setroot();
277 #endif
278 }
279 SYSINIT(cpu_rootconf, SI_SUB_ROOT_CONF, SI_ORDER_FIRST, cpu_rootconf, NULL);
280 
281 u_long	bootdev = 0;		/* not a cdev_t - encoding is different */
282 
283 #if defined(FFS) && defined(FFS_ROOT)
284 
285 /*
286  * The boot code uses old block device major numbers to pass bootdev to
287  * us.  We have to translate these to character device majors because
288  * we don't have block devices any more.
289  */
290 static int
291 boot_translate_majdev(int bmajor)
292 {
293 	static int conv[] = { BOOTMAJOR_CONVARY };
294 
295 	if (bmajor >= 0 && bmajor < NELEM(conv))
296 		return(conv[bmajor]);
297 	return(-1);
298 }
299 
300 /*
301  * Attempt to find the device from which we were booted.
302  * If we can do so, and not instructed not to do so,
303  * set rootdevs[] and rootdevnames[] to correspond to the
304  * boot device(s).
305  *
306  * This code survives in order to allow the system to be
307  * booted from legacy environments that do not correctly
308  * populate the kernel environment. There are significant
309  * restrictions on the bootability of the system in this
310  * situation; it can only be mounting root from a 'da'
311  * 'wd' or 'fd' device, and the root filesystem must be ufs.
312  */
313 static void
314 setroot(void)
315 {
316 	int majdev, mindev, unit, slice, part;
317 	cdev_t newrootdev, dev;
318 	char partname[2];
319 	char *sname;
320 
321 	if ((bootdev & B_MAGICMASK) != B_DEVMAGIC) {
322 		kprintf("no B_DEVMAGIC (bootdev=%#lx)\n", bootdev);
323 		return;
324 	}
325 	majdev = boot_translate_majdev(B_TYPE(bootdev));
326 	if (bootverbose) {
327 		kprintf("bootdev: %08lx type=%ld unit=%ld "
328 			"slice=%ld part=%ld major=%d\n",
329 			bootdev, B_TYPE(bootdev), B_UNIT(bootdev),
330 			B_SLICE(bootdev), B_PARTITION(bootdev), majdev);
331 	}
332 	dev = udev2dev(makeudev(majdev, 0), 0);
333 	if (!dev_is_good(dev))
334 		return;
335 	unit = B_UNIT(bootdev);
336 	slice = B_SLICE(bootdev);
337 	if (slice == WHOLE_DISK_SLICE)
338 		slice = COMPATIBILITY_SLICE;
339 	if (slice < 0 || slice >= MAX_SLICES) {
340 		kprintf("bad slice\n");
341 		return;
342 	}
343 
344 	part = B_PARTITION(bootdev);
345 	mindev = dkmakeminor(unit, slice, part);
346 	newrootdev = udev2dev(makeudev(majdev, mindev), 0);
347 	if (!dev_is_good(newrootdev))
348 		return;
349 	sname = dsname(newrootdev, unit, slice, part, partname);
350 	rootdevnames[0] = kmalloc(strlen(sname) + 6, M_DEVBUF, M_WAITOK);
351 	ksprintf(rootdevnames[0], "ufs:%s%s", sname, partname);
352 
353 	/*
354 	 * For properly dangerously dedicated disks (ones with a historical
355 	 * bogus partition table), the boot blocks will give slice = 4, but
356 	 * the kernel will only provide the compatibility slice since it
357 	 * knows that slice 4 is not a real slice.  Arrange to try mounting
358 	 * the compatibility slice as root if mounting the slice passed by
359 	 * the boot blocks fails.  This handles the dangerously dedicated
360 	 * case and perhaps others.
361 	 */
362 	if (slice == COMPATIBILITY_SLICE)
363 		return;
364 	slice = COMPATIBILITY_SLICE;
365 	sname = dsname(newrootdev, unit, slice, part, partname);
366 	rootdevnames[1] = kmalloc(strlen(sname) + 6, M_DEVBUF, M_WAITOK);
367 	ksprintf(rootdevnames[1], "ufs:%s%s", sname, partname);
368 }
369 #endif
370 
371 #if defined(NFS) && defined(NFS_ROOT)
372 #if !defined(BOOTP_NFSROOT)
373 
374 #include <sys/socket.h>
375 #include <net/if.h>
376 #include <net/if_dl.h>
377 #include <net/if_types.h>
378 #include <net/if_var.h>
379 #include <net/ethernet.h>
380 #include <netinet/in.h>
381 #include <vfs/nfs/rpcv2.h>
382 #include <vfs/nfs/nfsproto.h>
383 #include <vfs/nfs/nfs.h>
384 #include <vfs/nfs/nfsdiskless.h>
385 
386 extern struct nfs_diskless	nfs_diskless;
387 
388 /*
389  * Convert a kenv variable to a sockaddr.  If the kenv variable does not
390  * exist the sockaddr will remain zerod out (callers typically just check
391  * sin_len).  A network address of 0.0.0.0 is equivalent to failure.
392  */
393 static int
394 inaddr_to_sockaddr(char *ev, struct sockaddr_in *sa)
395 {
396 	u_int32_t	a[4];
397 	char		*cp;
398 
399 	bzero(sa, sizeof(*sa));
400 
401 	if ((cp = kgetenv(ev)) == NULL)
402 		return(1);
403 	if (ksscanf(cp, "%d.%d.%d.%d", &a[0], &a[1], &a[2], &a[3]) != 4)
404 		return(1);
405 	if (a[0] == 0 && a[1] == 0 && a[2] == 0 && a[3] == 0)
406 		return(1);
407 	/* XXX is this ordering correct? */
408 	sa->sin_addr.s_addr = (a[3] << 24) + (a[2] << 16) + (a[1] << 8) + a[0];
409 	sa->sin_len = sizeof(*sa);
410 	sa->sin_family = AF_INET;
411 	return(0);
412 }
413 
414 static int
415 hwaddr_to_sockaddr(char *ev, struct sockaddr_dl *sa)
416 {
417 	char		*cp;
418 	u_int32_t	a[6];
419 
420 	bzero(sa, sizeof(*sa));
421 	sa->sdl_len = sizeof(*sa);
422 	sa->sdl_family = AF_LINK;
423 	sa->sdl_type = IFT_ETHER;
424 	sa->sdl_alen = ETHER_ADDR_LEN;
425 	if ((cp = kgetenv(ev)) == NULL)
426 		return(1);
427 	if (ksscanf(cp, "%x:%x:%x:%x:%x:%x", &a[0], &a[1], &a[2], &a[3], &a[4], &a[5]) != 6)
428 		return(1);
429 	sa->sdl_data[0] = a[0];
430 	sa->sdl_data[1] = a[1];
431 	sa->sdl_data[2] = a[2];
432 	sa->sdl_data[3] = a[3];
433 	sa->sdl_data[4] = a[4];
434 	sa->sdl_data[5] = a[5];
435 	return(0);
436 }
437 
438 static int
439 decode_nfshandle(char *ev, u_char *fh)
440 {
441 	u_char	*cp;
442 	int	len, val;
443 
444 	if (((cp = kgetenv(ev)) == NULL) || (strlen(cp) < 2) || (*cp != 'X'))
445 		return(0);
446 	len = 0;
447 	cp++;
448 	for (;;) {
449 		if (*cp == 'X')
450 			return(len);
451 		if ((ksscanf(cp, "%2x", &val) != 1) || (val > 0xff))
452 			return(0);
453 		*(fh++) = val;
454 		len++;
455 		cp += 2;
456 		if (len > NFSX_V2FH)
457 		    return(0);
458 	}
459 }
460 
461 /*
462  * Populate the essential fields in the nfsv3_diskless structure.
463  *
464  * The loader is expected to export the following environment variables:
465  *
466  * boot.netif.ip		IP address on boot interface
467  * boot.netif.netmask		netmask on boot interface
468  * boot.netif.gateway		default gateway (optional)
469  * boot.netif.hwaddr		hardware address of boot interface
470  * boot.netif.name		name of boot interface (instead of hw addr)
471  * boot.nfsroot.server		IP address of root filesystem server
472  * boot.nfsroot.path		path of the root filesystem on server
473  * boot.nfsroot.nfshandle	NFS handle for root filesystem on server
474  */
475 static void
476 pxe_setup_nfsdiskless(void)
477 {
478 	struct nfs_diskless	*nd = &nfs_diskless;
479 	struct ifnet		*ifp;
480 	struct ifaddr		*ifa;
481 	struct sockaddr_dl	*sdl, ourdl;
482 	struct sockaddr_in	myaddr, netmask;
483 	char			*cp;
484 
485 	/* set up interface */
486 	if (inaddr_to_sockaddr("boot.netif.ip", &myaddr))
487 		return;
488 	if (inaddr_to_sockaddr("boot.netif.netmask", &netmask)) {
489 		kprintf("PXE: no netmask\n");
490 		return;
491 	}
492 	bcopy(&myaddr, &nd->myif.ifra_addr, sizeof(myaddr));
493 	bcopy(&myaddr, &nd->myif.ifra_broadaddr, sizeof(myaddr));
494 	((struct sockaddr_in *) &nd->myif.ifra_broadaddr)->sin_addr.s_addr =
495 		myaddr.sin_addr.s_addr | ~ netmask.sin_addr.s_addr;
496 	bcopy(&netmask, &nd->myif.ifra_mask, sizeof(netmask));
497 
498 	if ((cp = kgetenv("boot.netif.name")) != NULL) {
499 		ifnet_lock();
500 		ifp = ifunit(cp);
501 		if (ifp) {
502 			strlcpy(nd->myif.ifra_name, ifp->if_xname,
503 			    sizeof(nd->myif.ifra_name));
504 			ifnet_unlock();
505 			goto match_done;
506 		}
507 		ifnet_unlock();
508 		kprintf("PXE: cannot find interface %s\n", cp);
509 		return;
510 	}
511 
512 	if (hwaddr_to_sockaddr("boot.netif.hwaddr", &ourdl)) {
513 		kprintf("PXE: no hardware address\n");
514 		return;
515 	}
516 	ifa = NULL;
517 	ifnet_lock();
518 	TAILQ_FOREACH(ifp, &ifnetlist, if_link) {
519 		struct ifaddr_container *ifac;
520 
521 		TAILQ_FOREACH(ifac, &ifp->if_addrheads[mycpuid], ifa_link) {
522 			ifa = ifac->ifa;
523 
524 			if ((ifa->ifa_addr->sa_family == AF_LINK) &&
525 			    (sdl = ((struct sockaddr_dl *)ifa->ifa_addr))) {
526 				if ((sdl->sdl_type == ourdl.sdl_type) &&
527 				    (sdl->sdl_alen == ourdl.sdl_alen) &&
528 				    !bcmp(sdl->sdl_data + sdl->sdl_nlen,
529 					  ourdl.sdl_data + ourdl.sdl_nlen,
530 					  sdl->sdl_alen)) {
531 					strlcpy(nd->myif.ifra_name,
532 					    ifp->if_xname,
533 					    sizeof(nd->myif.ifra_name));
534 					ifnet_unlock();
535 					goto match_done;
536 				}
537 			}
538 		}
539 	}
540 	ifnet_unlock();
541 	kprintf("PXE: no interface\n");
542 	return;	/* no matching interface */
543 match_done:
544 	/* set up gateway */
545 	inaddr_to_sockaddr("boot.netif.gateway", &nd->mygateway);
546 
547 	/* XXX set up swap? */
548 
549 	/* set up root mount */
550 	nd->root_args.rsize = nfsroot_iosize;
551 	nd->root_args.wsize = nfsroot_iosize;
552 	nd->root_args.sotype = SOCK_STREAM;
553 	nd->root_args.readahead = nfsroot_rahead;
554 	nd->root_args.flags = NFSMNT_WSIZE | NFSMNT_RSIZE | NFSMNT_RESVPORT |
555 			      NFSMNT_READAHEAD;
556 	if (inaddr_to_sockaddr("boot.nfsroot.server", &nd->root_saddr)) {
557 		kprintf("PXE: no server\n");
558 		return;
559 	}
560 	nd->root_saddr.sin_port = htons(NFS_PORT);
561 
562 	/*
563 	 * A tftp-only loader may pass NFS path information without a
564 	 * root handle.  Generate a warning but continue configuring.
565 	 */
566 	if (decode_nfshandle("boot.nfsroot.nfshandle", &nd->root_fh[0]) == 0) {
567 		kprintf("PXE: Warning, no NFS handle passed from loader\n");
568 	}
569 	if ((cp = kgetenv("boot.nfsroot.path")) != NULL)
570 		strncpy(nd->root_hostnam, cp, MNAMELEN - 1);
571 
572 	nfs_diskless_valid = 1;
573 }
574 
575 #endif
576 #endif
577