1 /* 2 * ---------------------------------------------------------------------------- 3 * "THE BEER-WARE LICENSE" (Revision 42): 4 * <phk@FreeBSD.ORG> wrote this file. As long as you retain this notice you 5 * can do whatever you want with this stuff. If we meet some day, and you think 6 * this stuff is worth it, you can buy me a beer in return. Poul-Henning Kamp 7 * ---------------------------------------------------------------------------- 8 * 9 * $FreeBSD: src/sys/dev/md/md.c,v 1.8.2.2 2002/08/19 17:43:34 jdp Exp $ 10 * 11 */ 12 13 #include "opt_md.h" /* We have adopted some tasks from MFS */ 14 15 #include <sys/param.h> 16 #include <sys/systm.h> 17 #include <sys/buf.h> 18 #include <sys/conf.h> 19 #include <sys/devicestat.h> 20 #include <sys/disk.h> 21 #include <sys/kernel.h> 22 #include <sys/malloc.h> 23 #include <sys/sysctl.h> 24 #include <sys/linker.h> 25 #include <sys/proc.h> 26 #include <sys/buf2.h> 27 #include <sys/thread2.h> 28 #include <sys/queue.h> 29 #include <sys/udev.h> 30 31 #ifndef MD_NSECT 32 #define MD_NSECT (10000 * 2) 33 #endif 34 35 MALLOC_DEFINE(M_MD, "MD disk", "Memory Disk"); 36 MALLOC_DEFINE(M_MDSECT, "MD sectors", "Memory Disk Sectors"); 37 38 static int md_debug; 39 SYSCTL_INT(_debug, OID_AUTO, mddebug, CTLFLAG_RW, &md_debug, 0, 40 "Enable debug output for memory disk devices"); 41 42 #if defined(MD_ROOT) && defined(MD_ROOT_SIZE) 43 /* Image gets put here: */ 44 static u_char mfs_root[MD_ROOT_SIZE*1024] = "MFS Filesystem goes here"; 45 static u_char end_mfs_root[] __unused = "MFS Filesystem had better STOP here"; 46 #endif 47 48 static int mdrootready; 49 50 static d_strategy_t mdstrategy; 51 static d_strategy_t mdstrategy_preload; 52 static d_strategy_t mdstrategy_malloc; 53 static d_open_t mdopen; 54 static d_close_t mdclose; 55 static d_ioctl_t mdioctl; 56 57 static struct dev_ops md_ops = { 58 { "md", 0, D_DISK | D_CANFREE | D_MEMDISK | D_TRACKCLOSE}, 59 .d_open = mdopen, 60 .d_close = mdclose, 61 .d_read = physread, 62 .d_write = physwrite, 63 .d_ioctl = mdioctl, 64 .d_strategy = mdstrategy, 65 }; 66 67 struct md_s { 68 int unit; 69 struct devstat stats; 70 struct bio_queue_head bio_queue; 71 struct disk disk; 72 cdev_t dev; 73 int busy; 74 enum { /* Memory disk type */ 75 MD_MALLOC, 76 MD_PRELOAD 77 } type; 78 unsigned nsect; 79 80 /* MD_MALLOC related fields */ 81 unsigned nsecp; 82 u_char **secp; 83 84 /* MD_PRELOAD related fields */ 85 u_char *pl_ptr; 86 unsigned pl_len; 87 TAILQ_ENTRY(md_s) link; 88 }; 89 TAILQ_HEAD(mdshead, md_s) mdlist = TAILQ_HEAD_INITIALIZER(mdlist); 90 91 static int mdunits; 92 static int refcnt; 93 94 static struct md_s *mdcreate(unsigned); 95 static void mdcreate_malloc(void); 96 static int mdinit(module_t, int, void *); 97 static void md_drvinit(void *); 98 static int md_drvcleanup(void); 99 100 static int 101 mdinit(module_t mod, int cmd, void *arg) 102 { 103 int ret = 0; 104 105 switch(cmd) { 106 case MOD_LOAD: 107 TAILQ_INIT(&mdlist); 108 md_drvinit(NULL); 109 break; 110 case MOD_UNLOAD: 111 ret = md_drvcleanup(); 112 break; 113 default: 114 ret = EINVAL; 115 break; 116 } 117 118 return (ret); 119 } 120 121 static int 122 mdopen(struct dev_open_args *ap) 123 { 124 cdev_t dev = ap->a_head.a_dev; 125 struct md_s *sc; 126 127 if (md_debug) 128 kprintf("mdopen(%s %x %x)\n", 129 devtoname(dev), ap->a_oflags, ap->a_devtype); 130 131 sc = dev->si_drv1; 132 if (sc->unit + 1 == mdunits) 133 mdcreate_malloc(); 134 135 atomic_add_int(&refcnt, 1); 136 return (0); 137 } 138 139 static int 140 mdclose(struct dev_close_args *ap) 141 { 142 cdev_t dev = ap->a_head.a_dev; 143 struct md_s *sc; 144 145 if (md_debug) 146 kprintf("mdclose(%s %x %x)\n", 147 devtoname(dev), ap->a_fflag, ap->a_devtype); 148 sc = dev->si_drv1; 149 atomic_add_int(&refcnt, -1); 150 151 return (0); 152 } 153 154 static int 155 mdioctl(struct dev_ioctl_args *ap) 156 { 157 cdev_t dev = ap->a_head.a_dev; 158 159 if (md_debug) 160 kprintf("mdioctl(%s %lx %p %x)\n", 161 devtoname(dev), ap->a_cmd, ap->a_data, ap->a_fflag); 162 163 return (ENOIOCTL); 164 } 165 166 static int 167 mdstrategy(struct dev_strategy_args *ap) 168 { 169 cdev_t dev = ap->a_head.a_dev; 170 struct bio *bio = ap->a_bio; 171 struct buf *bp = bio->bio_buf; 172 struct md_s *sc; 173 174 if (md_debug > 1) { 175 kprintf("mdstrategy(%p) %s %08x, %lld, %d, %p)\n", 176 bp, devtoname(dev), bp->b_flags, 177 (long long)bio->bio_offset, 178 bp->b_bcount, bp->b_data); 179 } 180 bio->bio_driver_info = dev; 181 sc = dev->si_drv1; 182 if (sc->type == MD_MALLOC) { 183 mdstrategy_malloc(ap); 184 } else { 185 mdstrategy_preload(ap); 186 } 187 return(0); 188 } 189 190 191 static int 192 mdstrategy_malloc(struct dev_strategy_args *ap) 193 { 194 cdev_t dev = ap->a_head.a_dev; 195 struct bio *bio = ap->a_bio; 196 struct buf *bp = bio->bio_buf; 197 unsigned secno, nsec, secval, uc; 198 u_char *secp, **secpp, *dst; 199 struct md_s *sc; 200 int i; 201 202 if (md_debug > 1) 203 kprintf("mdstrategy_malloc(%p) %s %08xx, %lld, %d, %p)\n", 204 bp, devtoname(dev), bp->b_flags, 205 (long long)bio->bio_offset, 206 bp->b_bcount, bp->b_data); 207 208 sc = dev->si_drv1; 209 210 crit_enter(); 211 212 bioqdisksort(&sc->bio_queue, bio); 213 214 if (sc->busy) { 215 crit_exit(); 216 return(0); 217 } 218 219 sc->busy++; 220 221 while (1) { 222 bio = bioq_first(&sc->bio_queue); 223 if (bio == NULL) { 224 crit_exit(); 225 break; 226 } 227 crit_exit(); 228 bioq_remove(&sc->bio_queue, bio); 229 bp = bio->bio_buf; 230 231 devstat_start_transaction(&sc->stats); 232 233 switch (bp->b_cmd) { 234 case BUF_CMD_FREEBLKS: 235 case BUF_CMD_READ: 236 case BUF_CMD_WRITE: 237 break; 238 default: 239 panic("md: bad b_cmd %d", bp->b_cmd); 240 } 241 242 nsec = bp->b_bcount >> DEV_BSHIFT; 243 secno = (unsigned)(bio->bio_offset >> DEV_BSHIFT); 244 dst = bp->b_data; 245 while (nsec--) { 246 if (secno < sc->nsecp) { 247 secpp = &sc->secp[secno]; 248 if ((u_int)(uintptr_t)*secpp > 255) { 249 secp = *secpp; 250 secval = 0; 251 } else { 252 secp = NULL; 253 secval = (u_int)(uintptr_t)*secpp; 254 } 255 } else { 256 secpp = NULL; 257 secp = NULL; 258 secval = 0; 259 } 260 if (md_debug > 2) 261 kprintf("%08x %p %p %d\n", bp->b_flags, secpp, secp, secval); 262 263 switch (bp->b_cmd) { 264 case BUF_CMD_FREEBLKS: 265 if (secpp) { 266 if (secp) 267 kfree(secp, M_MDSECT); 268 *secpp = NULL; 269 } 270 break; 271 case BUF_CMD_READ: 272 if (secp) { 273 bcopy(secp, dst, DEV_BSIZE); 274 } else if (secval) { 275 for (i = 0; i < DEV_BSIZE; i++) 276 dst[i] = secval; 277 } else { 278 bzero(dst, DEV_BSIZE); 279 } 280 break; 281 case BUF_CMD_WRITE: 282 uc = dst[0]; 283 for (i = 1; i < DEV_BSIZE; i++) 284 if (dst[i] != uc) 285 break; 286 if (i == DEV_BSIZE && !uc) { 287 if (secp) 288 kfree(secp, M_MDSECT); 289 if (secpp) 290 *secpp = (u_char *)(uintptr_t)uc; 291 } else { 292 if (!secpp) { 293 secpp = kmalloc((secno + nsec + 1) * sizeof(u_char *), 294 M_MD, 295 M_WAITOK | M_ZERO); 296 bcopy(sc->secp, secpp, sc->nsecp * sizeof(u_char *)); 297 kfree(sc->secp, M_MD); 298 sc->secp = secpp; 299 sc->nsecp = secno + nsec + 1; 300 secpp = &sc->secp[secno]; 301 } 302 if (i == DEV_BSIZE) { 303 if (secp) 304 kfree(secp, M_MDSECT); 305 *secpp = (u_char *)(uintptr_t)uc; 306 } else { 307 if (!secp) 308 secp = kmalloc(DEV_BSIZE, 309 M_MDSECT, 310 M_WAITOK); 311 bcopy(dst, secp, DEV_BSIZE); 312 313 *secpp = secp; 314 } 315 } 316 break; 317 default: 318 panic("md: bad b_cmd %d", bp->b_cmd); 319 320 } 321 secno++; 322 dst += DEV_BSIZE; 323 } 324 bp->b_resid = 0; 325 devstat_end_transaction_buf(&sc->stats, bp); 326 biodone(bio); 327 crit_enter(); 328 } 329 sc->busy = 0; 330 return(0); 331 } 332 333 334 static int 335 mdstrategy_preload(struct dev_strategy_args *ap) 336 { 337 cdev_t dev = ap->a_head.a_dev; 338 struct bio *bio = ap->a_bio; 339 struct buf *bp = bio->bio_buf; 340 struct md_s *sc; 341 342 if (md_debug > 1) 343 kprintf("mdstrategy_preload(%p) %s %08x, %lld, %d, %p)\n", 344 bp, devtoname(dev), bp->b_flags, 345 (long long)bio->bio_offset, 346 bp->b_bcount, bp->b_data); 347 348 sc = dev->si_drv1; 349 350 crit_enter(); 351 352 bioqdisksort(&sc->bio_queue, bio); 353 354 if (sc->busy) { 355 crit_exit(); 356 return(0); 357 } 358 359 sc->busy++; 360 361 while (1) { 362 bio = bioq_first(&sc->bio_queue); 363 if (bio) 364 bioq_remove(&sc->bio_queue, bio); 365 crit_exit(); 366 if (bio == NULL) 367 break; 368 369 devstat_start_transaction(&sc->stats); 370 371 switch (bp->b_cmd) { 372 case BUF_CMD_FREEBLKS: 373 break; 374 case BUF_CMD_READ: 375 bcopy(sc->pl_ptr + bio->bio_offset, 376 bp->b_data, bp->b_bcount); 377 break; 378 case BUF_CMD_WRITE: 379 bcopy(bp->b_data, sc->pl_ptr + bio->bio_offset, 380 bp->b_bcount); 381 break; 382 default: 383 panic("md: bad cmd %d\n", bp->b_cmd); 384 } 385 bp->b_resid = 0; 386 devstat_end_transaction_buf(&sc->stats, bp); 387 biodone(bio); 388 crit_enter(); 389 } 390 sc->busy = 0; 391 return(0); 392 } 393 394 static struct md_s * 395 mdcreate(unsigned length) 396 { 397 struct md_s *sc; 398 struct disk_info info; 399 400 sc = kmalloc(sizeof(*sc), M_MD, M_WAITOK | M_ZERO); 401 sc->unit = mdunits++; 402 bioq_init(&sc->bio_queue); 403 devstat_add_entry(&sc->stats, "md", sc->unit, DEV_BSIZE, 404 DEVSTAT_NO_ORDERED_TAGS, 405 DEVSTAT_TYPE_DIRECT | DEVSTAT_TYPE_IF_OTHER, 406 DEVSTAT_PRIORITY_OTHER); 407 sc->dev = disk_create(sc->unit, &sc->disk, &md_ops); 408 sc->dev->si_drv1 = sc; 409 sc->dev->si_iosize_max = DFLTPHYS; 410 disk_setdisktype(&sc->disk, "memory"); 411 412 bzero(&info, sizeof(info)); 413 info.d_media_blksize = DEV_BSIZE; /* mandatory */ 414 info.d_media_blocks = length / DEV_BSIZE; 415 416 info.d_secpertrack = 1024; /* optional */ 417 info.d_nheads = 1; 418 info.d_secpercyl = info.d_secpertrack * info.d_nheads; 419 info.d_ncylinders = (u_int)(info.d_media_blocks / info.d_secpercyl); 420 disk_setdiskinfo(&sc->disk, &info); 421 TAILQ_INSERT_HEAD(&mdlist, sc, link); 422 423 return (sc); 424 } 425 426 427 static void 428 mdcreate_preload(u_char *image, unsigned length) 429 { 430 struct md_s *sc; 431 432 sc = mdcreate(length); 433 sc->type = MD_PRELOAD; 434 sc->nsect = length / DEV_BSIZE; 435 sc->pl_ptr = image; 436 sc->pl_len = length; 437 438 if (sc->unit == 0) 439 mdrootready = 1; 440 } 441 442 static void 443 mdcreate_malloc(void) 444 { 445 struct md_s *sc; 446 447 sc = mdcreate(MD_NSECT*DEV_BSIZE); 448 sc->type = MD_MALLOC; 449 450 sc->nsect = MD_NSECT; /* for now */ 451 sc->secp = kmalloc(sizeof(u_char *), M_MD, M_WAITOK | M_ZERO); 452 sc->nsecp = 1; 453 kprintf("md%d: Malloc disk\n", sc->unit); 454 } 455 456 static int 457 md_drvcleanup(void) 458 { 459 460 int secno; 461 struct md_s *sc, *sc_temp; 462 463 if (atomic_fetchadd_int(&refcnt, 0) != 0) 464 return EBUSY; 465 466 /* 467 * Go through all the md devices, freeing up all the 468 * memory allocated for sectors, and the md_s struct 469 * itself. 470 */ 471 TAILQ_FOREACH_MUTABLE(sc, &mdlist, link, sc_temp) { 472 for (secno = 0; secno < sc->nsecp; secno++) { 473 if ((u_int)(uintptr_t)sc->secp[secno] > 255) 474 kfree(sc->secp[secno], M_MDSECT); 475 } 476 477 if (sc->dev != NULL) 478 disk_destroy(&sc->disk); 479 480 devstat_remove_entry(&sc->stats); 481 TAILQ_REMOVE(&mdlist, sc, link); 482 483 kfree(sc->secp, M_MD); 484 kfree(sc, M_MD); 485 } 486 487 return 0; 488 489 } 490 491 static void 492 md_drvinit(void *unused) 493 { 494 495 caddr_t mod; 496 caddr_t c; 497 u_char *ptr, *name, *type; 498 unsigned len; 499 500 #ifdef MD_ROOT_SIZE 501 mdcreate_preload(mfs_root, MD_ROOT_SIZE*1024); 502 #endif 503 mod = NULL; 504 while ((mod = preload_search_next_name(mod)) != NULL) { 505 name = (char *)preload_search_info(mod, MODINFO_NAME); 506 type = (char *)preload_search_info(mod, MODINFO_TYPE); 507 if (name == NULL) 508 continue; 509 if (type == NULL) 510 continue; 511 if (strcmp(type, "md_image") && strcmp(type, "mfs_root")) 512 continue; 513 c = preload_search_info(mod, MODINFO_ADDR); 514 ptr = *(u_char **)c; 515 c = preload_search_info(mod, MODINFO_SIZE); 516 len = *(unsigned *)c; 517 kprintf("md%d: Preloaded image <%s> %d bytes at %p\n", 518 mdunits, name, len, ptr); 519 mdcreate_preload(ptr, len); 520 } 521 mdcreate_malloc(); 522 } 523 524 DEV_MODULE(md, mdinit, NULL); 525 526 #ifdef MD_ROOT 527 static void 528 md_takeroot(void *junk) 529 { 530 if (mdrootready) 531 rootdevnames[0] = "ufs:/dev/md0s0"; 532 } 533 534 SYSINIT(md_root, SI_SUB_MOUNT_ROOT, SI_ORDER_FIRST, md_takeroot, NULL); 535 #endif 536