1 /*- 2 * Copyright (c) 1990 The Regents of the University of California. 3 * Copyright (c) 2008 The DragonFly Project. 4 * All rights reserved. 5 * 6 * This code is derived from software contributed to Berkeley by 7 * William Jolitz. 8 * 9 * Redistribution and use in source and binary forms, with or without 10 * modification, are permitted provided that the following conditions 11 * are met: 12 * 1. Redistributions of source code must retain the above copyright 13 * notice, this list of conditions and the following disclaimer. 14 * 2. Redistributions in binary form must reproduce the above copyright 15 * notice, this list of conditions and the following disclaimer in the 16 * documentation and/or other materials provided with the distribution. 17 * 3. Neither the name of the University nor the names of its contributors 18 * may be used to endorse or promote products derived from this software 19 * without specific prior written permission. 20 * 21 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 22 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 24 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 26 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 27 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 28 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 29 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 30 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 31 * SUCH DAMAGE. 32 * 33 * from: @(#)autoconf.c 7.1 (Berkeley) 5/9/91 34 * $FreeBSD: src/sys/i386/i386/autoconf.c,v 1.146.2.2 2001/06/07 06:05:58 dd Exp $ 35 */ 36 37 /* 38 * Setup the system to run on the current machine. 39 * 40 * Configure() is called at boot time and initializes the vba 41 * device tables and the memory controller monitoring. Available 42 * devices are determined (from possibilities mentioned in ioconf.c), 43 * and the drivers are initialized. 44 */ 45 #include "opt_bootp.h" 46 #include "opt_cd9660.h" 47 #include "opt_nfs.h" 48 #include "opt_nfsroot.h" 49 #include "opt_rootdevname.h" 50 #include "opt_swap.h" 51 52 #include "use_isa.h" 53 54 #include <sys/param.h> 55 #include <sys/systm.h> 56 #include <sys/bootmaj.h> 57 #include <sys/bus.h> 58 #include <sys/buf.h> 59 #include <sys/conf.h> 60 #include <sys/diskslice.h> 61 #include <sys/reboot.h> 62 #include <sys/kernel.h> 63 #include <sys/malloc.h> 64 #include <sys/mount.h> 65 #include <sys/cons.h> 66 #include <sys/thread.h> 67 #include <sys/device.h> 68 #include <sys/machintr.h> 69 70 #include <vm/vm_kern.h> 71 #include <vm/vm_extern.h> 72 #include <vm/vm_pager.h> 73 74 #if 0 75 #include <machine/pcb.h> 76 #include <machine/pcb_ext.h> 77 #endif 78 #include <machine/smp.h> 79 #include <machine/globaldata.h> 80 #include <machine/md_var.h> 81 82 #define MAXBUFSTRUCTSIZE ((size_t)512 * 1024 * 1024) 83 84 #if NISA > 0 85 #include <bus/isa/isavar.h> 86 87 device_t isa_bus_device = NULL; 88 #endif 89 90 static void cpu_startup (void *); 91 static void configure_first (void *); 92 static void configure (void *); 93 static void configure_final (void *); 94 95 #if defined(NFS) && defined(NFS_ROOT) 96 #if !defined(BOOTP_NFSROOT) 97 static void pxe_setup_nfsdiskless(void); 98 #endif 99 #endif 100 101 SYSINIT(cpu, SI_BOOT2_START_CPU, SI_ORDER_FIRST, cpu_startup, NULL); 102 SYSINIT(configure1, SI_SUB_CONFIGURE, SI_ORDER_FIRST, configure_first, NULL); 103 /* SI_ORDER_SECOND is hookable */ 104 SYSINIT(configure2, SI_SUB_CONFIGURE, SI_ORDER_THIRD, configure, NULL); 105 /* SI_ORDER_MIDDLE is hookable */ 106 SYSINIT(configure3, SI_SUB_CONFIGURE, SI_ORDER_ANY, configure_final, NULL); 107 108 cdev_t rootdev = NULL; 109 cdev_t dumpdev = NULL; 110 111 /* 112 * nfsroot.iosize may be set in loader.conf, 32768 is recommended to 113 * be able to max-out a GigE link if the server supports it. Many servers 114 * do not so the default is 8192. 115 * 116 * nfsroot.rahead defaults to something reasonable, can be overridden. 117 */ 118 static int nfsroot_iosize = 8192; 119 TUNABLE_INT("nfsroot.iosize", &nfsroot_iosize); 120 static int nfsroot_rahead = 4; 121 TUNABLE_INT("nfsroot.rahead", &nfsroot_rahead); 122 123 /* 124 * 125 */ 126 static void 127 cpu_startup(void *dummy) 128 { 129 vm_offset_t buffer_sva; 130 vm_offset_t buffer_eva; 131 vm_offset_t pager_sva; 132 vm_offset_t pager_eva; 133 134 kprintf("%s", version); 135 kprintf("real memory = %ju (%juK bytes)\n", 136 (uintmax_t)ptoa(Maxmem), (uintmax_t)(ptoa(Maxmem) / 1024)); 137 138 if (nbuf == 0) { 139 long factor = NBUFCALCSIZE / 1024; /* KB/nbuf */ 140 long kbytes = physmem * (PAGE_SIZE / 1024); /* physmem */ 141 142 nbuf = 50; 143 144 if (kbytes > 128 * 1024) 145 nbuf += (kbytes - 128 * 1024) / (factor * 20); 146 if (maxbcache && nbuf > maxbcache / NBUFCALCSIZE) 147 nbuf = maxbcache / NBUFCALCSIZE; 148 149 if ((size_t)nbuf * sizeof(struct buf) > MAXBUFSTRUCTSIZE) { 150 kprintf("Warning: nbuf capped at %ld due to the " 151 "reasonability limit\n", nbuf); 152 nbuf = MAXBUFSTRUCTSIZE / sizeof(struct buf); 153 } 154 } 155 156 if (nbuf > (virtual_end - virtual_start) / (MAXBSIZE * 4)) { 157 nbuf = (virtual_end - virtual_start) / (MAXBSIZE * 4); 158 kprintf("Warning: nbufs capped at %ld for " 159 "valloc considerations\n", nbuf); 160 } 161 162 nswbuf_mem = lmax(lmin(nbuf / 32, 32), 4); 163 #ifdef NSWBUF_MIN 164 if (nswbuf_mem < NSWBUF_MIN) 165 nswbuf_mem = NSWBUF_MIN; 166 #endif 167 nswbuf_kva = lmax(lmin(nbuf / 4, 256), 16); 168 #ifdef NSWBUF_MIN 169 if (nswbuf_kva < NSWBUF_MIN) 170 nswbuf_kva = NSWBUF_MIN; 171 #endif 172 173 /* 174 * Allocate memory for the buffer cache 175 */ 176 buf = (void *)kmem_alloc(kernel_map, 177 nbuf * sizeof(struct buf), 178 VM_SUBSYS_BUF); 179 swbuf_mem = (void *)kmem_alloc(kernel_map, 180 nswbuf_mem * sizeof(struct buf), 181 VM_SUBSYS_BUF); 182 swbuf_kva = (void *)kmem_alloc(kernel_map, 183 nswbuf_kva * sizeof(struct buf), 184 VM_SUBSYS_BUF); 185 186 kmem_suballoc(kernel_map, clean_map, &clean_sva, &clean_eva, 187 (nbuf * MAXBSIZE * 2) + 188 (nswbuf_mem + nswbuf_kva) * MAXPHYS + 189 pager_map_size); 190 kmem_suballoc(clean_map, buffer_map, &buffer_sva, &buffer_eva, 191 (nbuf * MAXBSIZE * 2)); 192 buffer_map->system_map = 1; 193 kmem_suballoc(clean_map, pager_map, &pager_sva, &pager_eva, 194 (nswbuf_mem + nswbuf_kva) * MAXPHYS + 195 pager_map_size); 196 pager_map->system_map = 1; 197 kprintf("avail memory = %lu (%luK bytes)\n", ptoa(vmstats.v_free_count), 198 ptoa(vmstats.v_free_count) / 1024); 199 mp_start(); 200 mp_announce(); 201 cpu_setregs(); 202 } 203 204 /* 205 * Determine i/o configuration for a machine. 206 */ 207 static void 208 configure_first(void *dummy) 209 { 210 } 211 212 static void 213 configure(void *dummy) 214 { 215 /* 216 * Final interrupt support acviation, then enable hardware interrupts. 217 */ 218 MachIntrABI.finalize(); 219 cpu_enable_intr(); 220 221 /* 222 * This will configure all devices, generally starting with the 223 * nexus (pc64/x86_64/nexus.c). The nexus ISA code explicitly 224 * dummies up the attach in order to delay legacy initialization 225 * until after all other busses/subsystems have had a chance 226 * at those resources. 227 */ 228 root_bus_configure(); 229 230 #if NISA > 0 231 /* 232 * Explicitly probe and attach ISA last. The isa bus saves 233 * it's device node at attach time for us here. 234 */ 235 if (isa_bus_device) 236 isa_probe_children(isa_bus_device); 237 #endif 238 239 /* 240 * Allow lowering of the ipl to the lowest kernel level if we 241 * panic (or call tsleep() before clearing `cold'). No level is 242 * completely safe (since a panic may occur in a critical region 243 * at splhigh()), but we want at least bio interrupts to work. 244 */ 245 safepri = TDPRI_KERN_USER; 246 } 247 248 /* 249 * Finalize configure. Reprobe for the console, in case it was one 250 * of the devices which attached, then finish console initialization. 251 */ 252 static void 253 configure_final(void *dummy) 254 { 255 cninit(); 256 cninit_finish(); 257 258 if (bootverbose) 259 kprintf("Device configuration finished.\n"); 260 } 261 262 #ifdef BOOTP 263 void bootpc_init(void); 264 #endif 265 /* 266 * Do legacy root filesystem discovery. 267 */ 268 void 269 cpu_rootconf(void) 270 { 271 #ifdef BOOTP 272 bootpc_init(); 273 #endif 274 #if defined(NFS) && defined(NFS_ROOT) 275 #if !defined(BOOTP_NFSROOT) 276 pxe_setup_nfsdiskless(); 277 if (nfs_diskless_valid) 278 #endif 279 rootdevnames[0] = "nfs:"; 280 #endif 281 } 282 SYSINIT(cpu_rootconf, SI_SUB_ROOT_CONF, SI_ORDER_FIRST, cpu_rootconf, NULL); 283 284 #if defined(NFS) && defined(NFS_ROOT) 285 #if !defined(BOOTP_NFSROOT) 286 287 #include <sys/socket.h> 288 #include <net/if.h> 289 #include <net/if_dl.h> 290 #include <net/if_types.h> 291 #include <net/if_var.h> 292 #include <net/ethernet.h> 293 #include <netinet/in.h> 294 #include <vfs/nfs/rpcv2.h> 295 #include <vfs/nfs/nfsproto.h> 296 #include <vfs/nfs/nfs.h> 297 #include <vfs/nfs/nfsdiskless.h> 298 299 extern struct nfs_diskless nfs_diskless; 300 301 /* 302 * Convert a kenv variable to a sockaddr. If the kenv variable does not 303 * exist the sockaddr will remain zerod out (callers typically just check 304 * sin_len). A network address of 0.0.0.0 is equivalent to failure. 305 */ 306 static int 307 inaddr_to_sockaddr(char *ev, struct sockaddr_in *sa) 308 { 309 u_int32_t a[4]; 310 char *cp; 311 312 bzero(sa, sizeof(*sa)); 313 314 if ((cp = kgetenv(ev)) == NULL) 315 return(1); 316 if (ksscanf(cp, "%d.%d.%d.%d", &a[0], &a[1], &a[2], &a[3]) != 4) 317 return(1); 318 if (a[0] == 0 && a[1] == 0 && a[2] == 0 && a[3] == 0) 319 return(1); 320 /* XXX is this ordering correct? */ 321 sa->sin_addr.s_addr = (a[3] << 24) + (a[2] << 16) + (a[1] << 8) + a[0]; 322 sa->sin_len = sizeof(*sa); 323 sa->sin_family = AF_INET; 324 return(0); 325 } 326 327 static int 328 hwaddr_to_sockaddr(char *ev, struct sockaddr_dl *sa) 329 { 330 char *cp; 331 u_int32_t a[6]; 332 333 bzero(sa, sizeof(*sa)); 334 sa->sdl_len = sizeof(*sa); 335 sa->sdl_family = AF_LINK; 336 sa->sdl_type = IFT_ETHER; 337 sa->sdl_alen = ETHER_ADDR_LEN; 338 if ((cp = kgetenv(ev)) == NULL) 339 return(1); 340 if (ksscanf(cp, "%x:%x:%x:%x:%x:%x", &a[0], &a[1], &a[2], &a[3], &a[4], &a[5]) != 6) 341 return(1); 342 sa->sdl_data[0] = a[0]; 343 sa->sdl_data[1] = a[1]; 344 sa->sdl_data[2] = a[2]; 345 sa->sdl_data[3] = a[3]; 346 sa->sdl_data[4] = a[4]; 347 sa->sdl_data[5] = a[5]; 348 return(0); 349 } 350 351 static int 352 decode_nfshandle(char *ev, u_char *fh) 353 { 354 u_char *cp; 355 int len, val; 356 357 if (((cp = kgetenv(ev)) == NULL) || (strlen(cp) < 2) || (*cp != 'X')) 358 return(0); 359 len = 0; 360 cp++; 361 for (;;) { 362 if (*cp == 'X') 363 return(len); 364 if ((ksscanf(cp, "%2x", &val) != 1) || (val > 0xff)) 365 return(0); 366 *(fh++) = val; 367 len++; 368 cp += 2; 369 if (len > NFSX_V2FH) 370 return(0); 371 } 372 } 373 374 /* 375 * Populate the essential fields in the nfsv3_diskless structure. 376 * 377 * The loader is expected to export the following environment variables: 378 * 379 * boot.netif.ip IP address on boot interface 380 * boot.netif.netmask netmask on boot interface 381 * boot.netif.gateway default gateway (optional) 382 * boot.netif.hwaddr hardware address of boot interface 383 * boot.netif.name name of boot interface (instead of hw addr) 384 * boot.nfsroot.server IP address of root filesystem server 385 * boot.nfsroot.path path of the root filesystem on server 386 * boot.nfsroot.nfshandle NFS handle for root filesystem on server 387 */ 388 static void 389 pxe_setup_nfsdiskless(void) 390 { 391 struct nfs_diskless *nd = &nfs_diskless; 392 struct ifnet *ifp; 393 struct ifaddr *ifa; 394 struct sockaddr_dl *sdl, ourdl; 395 struct sockaddr_in myaddr, netmask; 396 char *cp; 397 398 /* set up interface */ 399 if (inaddr_to_sockaddr("boot.netif.ip", &myaddr)) 400 return; 401 if (inaddr_to_sockaddr("boot.netif.netmask", &netmask)) { 402 kprintf("PXE: no netmask\n"); 403 return; 404 } 405 bcopy(&myaddr, &nd->myif.ifra_addr, sizeof(myaddr)); 406 bcopy(&myaddr, &nd->myif.ifra_broadaddr, sizeof(myaddr)); 407 ((struct sockaddr_in *) &nd->myif.ifra_broadaddr)->sin_addr.s_addr = 408 myaddr.sin_addr.s_addr | ~ netmask.sin_addr.s_addr; 409 bcopy(&netmask, &nd->myif.ifra_mask, sizeof(netmask)); 410 411 if ((cp = kgetenv("boot.netif.name")) != NULL) { 412 ifnet_lock(); 413 ifp = ifunit(cp); 414 if (ifp) { 415 strlcpy(nd->myif.ifra_name, ifp->if_xname, 416 sizeof(nd->myif.ifra_name)); 417 ifnet_unlock(); 418 goto match_done; 419 } 420 ifnet_unlock(); 421 kprintf("PXE: cannot find interface %s\n", cp); 422 return; 423 } 424 425 if (hwaddr_to_sockaddr("boot.netif.hwaddr", &ourdl)) { 426 kprintf("PXE: no hardware address\n"); 427 return; 428 } 429 ifa = NULL; 430 ifnet_lock(); 431 TAILQ_FOREACH(ifp, &ifnetlist, if_link) { 432 struct ifaddr_container *ifac; 433 434 TAILQ_FOREACH(ifac, &ifp->if_addrheads[mycpuid], ifa_link) { 435 ifa = ifac->ifa; 436 437 if ((ifa->ifa_addr->sa_family == AF_LINK) && 438 (sdl = ((struct sockaddr_dl *)ifa->ifa_addr))) { 439 if ((sdl->sdl_type == ourdl.sdl_type) && 440 (sdl->sdl_alen == ourdl.sdl_alen) && 441 !bcmp(sdl->sdl_data + sdl->sdl_nlen, 442 ourdl.sdl_data + ourdl.sdl_nlen, 443 sdl->sdl_alen)) { 444 strlcpy(nd->myif.ifra_name, 445 ifp->if_xname, 446 sizeof(nd->myif.ifra_name)); 447 ifnet_unlock(); 448 goto match_done; 449 } 450 } 451 } 452 } 453 ifnet_unlock(); 454 kprintf("PXE: no interface\n"); 455 return; /* no matching interface */ 456 match_done: 457 /* set up gateway */ 458 inaddr_to_sockaddr("boot.netif.gateway", &nd->mygateway); 459 460 /* XXX set up swap? */ 461 462 /* set up root mount */ 463 nd->root_args.rsize = nfsroot_iosize; 464 nd->root_args.wsize = nfsroot_iosize; 465 nd->root_args.sotype = SOCK_STREAM; 466 nd->root_args.readahead = nfsroot_rahead; 467 nd->root_args.flags = NFSMNT_WSIZE | NFSMNT_RSIZE | NFSMNT_RESVPORT | 468 NFSMNT_READAHEAD; 469 if (inaddr_to_sockaddr("boot.nfsroot.server", &nd->root_saddr)) { 470 kprintf("PXE: no server\n"); 471 return; 472 } 473 nd->root_saddr.sin_port = htons(NFS_PORT); 474 475 /* 476 * A tftp-only loader may pass NFS path information without a 477 * root handle. Generate a warning but continue configuring. 478 */ 479 if (decode_nfshandle("boot.nfsroot.nfshandle", &nd->root_fh[0]) == 0) { 480 kprintf("PXE: Warning, no NFS handle passed from loader\n"); 481 } 482 if ((cp = kgetenv("boot.nfsroot.path")) != NULL) 483 strncpy(nd->root_hostnam, cp, MNAMELEN - 1); 484 485 nfs_diskless_valid = 1; 486 } 487 488 #endif 489 #endif 490