12d1661a5SPawel Jakub Dawidek /*- 22d1661a5SPawel Jakub Dawidek * Copyright (c) 2004 Pawel Jakub Dawidek <pjd@FreeBSD.org> 32d1661a5SPawel Jakub Dawidek * All rights reserved. 42d1661a5SPawel Jakub Dawidek * 52d1661a5SPawel Jakub Dawidek * Redistribution and use in source and binary forms, with or without 62d1661a5SPawel Jakub Dawidek * modification, are permitted provided that the following conditions 72d1661a5SPawel Jakub Dawidek * are met: 82d1661a5SPawel Jakub Dawidek * 1. Redistributions of source code must retain the above copyright 92d1661a5SPawel Jakub Dawidek * notice, this list of conditions and the following disclaimer. 102d1661a5SPawel Jakub Dawidek * 2. Redistributions in binary form must reproduce the above copyright 112d1661a5SPawel Jakub Dawidek * notice, this list of conditions and the following disclaimer in the 122d1661a5SPawel Jakub Dawidek * documentation and/or other materials provided with the distribution. 132d1661a5SPawel Jakub Dawidek * 142d1661a5SPawel Jakub Dawidek * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND 152d1661a5SPawel Jakub Dawidek * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 162d1661a5SPawel Jakub Dawidek * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 172d1661a5SPawel Jakub Dawidek * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE 182d1661a5SPawel Jakub Dawidek * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 192d1661a5SPawel Jakub Dawidek * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 202d1661a5SPawel Jakub Dawidek * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 212d1661a5SPawel Jakub Dawidek * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 222d1661a5SPawel Jakub Dawidek * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 232d1661a5SPawel Jakub Dawidek * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 242d1661a5SPawel Jakub Dawidek * SUCH DAMAGE. 252d1661a5SPawel Jakub Dawidek */ 262d1661a5SPawel Jakub Dawidek 272d1661a5SPawel Jakub Dawidek #include <sys/cdefs.h> 282d1661a5SPawel Jakub Dawidek __FBSDID("$FreeBSD$"); 292d1661a5SPawel Jakub Dawidek 302d1661a5SPawel Jakub Dawidek #include <sys/param.h> 312d1661a5SPawel Jakub Dawidek #include <sys/systm.h> 322d1661a5SPawel Jakub Dawidek #include <sys/kernel.h> 332d1661a5SPawel Jakub Dawidek #include <sys/module.h> 342d1661a5SPawel Jakub Dawidek #include <sys/limits.h> 352d1661a5SPawel Jakub Dawidek #include <sys/lock.h> 362d1661a5SPawel Jakub Dawidek #include <sys/mutex.h> 372d1661a5SPawel Jakub Dawidek #include <sys/bio.h> 382d1661a5SPawel Jakub Dawidek #include <sys/sysctl.h> 392d1661a5SPawel Jakub Dawidek #include <sys/malloc.h> 402d1661a5SPawel Jakub Dawidek #include <sys/bitstring.h> 412d1661a5SPawel Jakub Dawidek #include <vm/uma.h> 422d1661a5SPawel Jakub Dawidek #include <machine/atomic.h> 432d1661a5SPawel Jakub Dawidek #include <geom/geom.h> 442d1661a5SPawel Jakub Dawidek #include <sys/proc.h> 452d1661a5SPawel Jakub Dawidek #include <sys/kthread.h> 462d1661a5SPawel Jakub Dawidek #include <geom/raid3/g_raid3.h> 472d1661a5SPawel Jakub Dawidek 482d1661a5SPawel Jakub Dawidek 492d1661a5SPawel Jakub Dawidek static MALLOC_DEFINE(M_RAID3, "raid3 data", "GEOM_RAID3 Data"); 502d1661a5SPawel Jakub Dawidek 512d1661a5SPawel Jakub Dawidek SYSCTL_DECL(_kern_geom); 522d1661a5SPawel Jakub Dawidek SYSCTL_NODE(_kern_geom, OID_AUTO, raid3, CTLFLAG_RW, 0, "GEOM_RAID3 stuff"); 53809a9dc6SPawel Jakub Dawidek u_int g_raid3_debug = 0; 542d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, debug, CTLFLAG_RW, &g_raid3_debug, 0, 552d1661a5SPawel Jakub Dawidek "Debug level"); 562d1661a5SPawel Jakub Dawidek static u_int g_raid3_timeout = 8; 572d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, timeout, CTLFLAG_RW, &g_raid3_timeout, 582d1661a5SPawel Jakub Dawidek 0, "Time to wait on all raid3 components"); 592d1661a5SPawel Jakub Dawidek static u_int g_raid3_reqs_per_sync = 5; 602d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, reqs_per_sync, CTLFLAG_RW, 612d1661a5SPawel Jakub Dawidek &g_raid3_reqs_per_sync, 0, 622d1661a5SPawel Jakub Dawidek "Number of regular I/O requests per synchronization request"); 632d1661a5SPawel Jakub Dawidek static u_int g_raid3_syncs_per_sec = 100; 642d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, syncs_per_sec, CTLFLAG_RW, 652d1661a5SPawel Jakub Dawidek &g_raid3_syncs_per_sec, 0, 662d1661a5SPawel Jakub Dawidek "Number of synchronizations requests per second"); 672d1661a5SPawel Jakub Dawidek 682d1661a5SPawel Jakub Dawidek static u_int g_raid3_n64k = 50; 692d1661a5SPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.n64k", &g_raid3_n64k); 702d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, n64k, CTLFLAG_RD, &g_raid3_n64k, 0, 712d1661a5SPawel Jakub Dawidek "Maximum number of 64kB allocations"); 722d1661a5SPawel Jakub Dawidek static u_int g_raid3_n16k = 200; 732d1661a5SPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.n16k", &g_raid3_n16k); 742d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, n16k, CTLFLAG_RD, &g_raid3_n16k, 0, 752d1661a5SPawel Jakub Dawidek "Maximum number of 16kB allocations"); 762d1661a5SPawel Jakub Dawidek static u_int g_raid3_n4k = 1200; 772d1661a5SPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.n4k", &g_raid3_n4k); 782d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, n4k, CTLFLAG_RD, &g_raid3_n4k, 0, 792d1661a5SPawel Jakub Dawidek "Maximum number of 4kB allocations"); 802d1661a5SPawel Jakub Dawidek 812d1661a5SPawel Jakub Dawidek SYSCTL_NODE(_kern_geom_raid3, OID_AUTO, stat, CTLFLAG_RW, 0, 822d1661a5SPawel Jakub Dawidek "GEOM_RAID3 statistics"); 83dba915cfSPawel Jakub Dawidek static u_int g_raid3_parity_mismatch = 0; 84dba915cfSPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3_stat, OID_AUTO, parity_mismatch, CTLFLAG_RD, 85dba915cfSPawel Jakub Dawidek &g_raid3_parity_mismatch, 0, "Number of failures in VERIFY mode"); 862d1661a5SPawel Jakub Dawidek static u_int g_raid3_64k_requested = 0; 872d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3_stat, OID_AUTO, 64k_requested, CTLFLAG_RD, 882d1661a5SPawel Jakub Dawidek &g_raid3_64k_requested, 0, "Number of requested 64kB allocations"); 892d1661a5SPawel Jakub Dawidek static u_int g_raid3_64k_failed = 0; 902d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3_stat, OID_AUTO, 64k_failed, CTLFLAG_RD, 912d1661a5SPawel Jakub Dawidek &g_raid3_64k_failed, 0, "Number of failed 64kB allocations"); 922d1661a5SPawel Jakub Dawidek static u_int g_raid3_16k_requested = 0; 932d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3_stat, OID_AUTO, 16k_requested, CTLFLAG_RD, 942d1661a5SPawel Jakub Dawidek &g_raid3_16k_requested, 0, "Number of requested 16kB allocations"); 952d1661a5SPawel Jakub Dawidek static u_int g_raid3_16k_failed = 0; 962d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3_stat, OID_AUTO, 16k_failed, CTLFLAG_RD, 972d1661a5SPawel Jakub Dawidek &g_raid3_16k_failed, 0, "Number of failed 16kB allocations"); 982d1661a5SPawel Jakub Dawidek static u_int g_raid3_4k_requested = 0; 992d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3_stat, OID_AUTO, 4k_requested, CTLFLAG_RD, 1002d1661a5SPawel Jakub Dawidek &g_raid3_4k_requested, 0, "Number of requested 4kB allocations"); 1012d1661a5SPawel Jakub Dawidek static u_int g_raid3_4k_failed = 0; 1022d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3_stat, OID_AUTO, 4k_failed, CTLFLAG_RD, 1032d1661a5SPawel Jakub Dawidek &g_raid3_4k_failed, 0, "Number of failed 4kB allocations"); 1042d1661a5SPawel Jakub Dawidek 1052d1661a5SPawel Jakub Dawidek #define MSLEEP(ident, mtx, priority, wmesg, timeout) do { \ 1062d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Sleeping %p.", __func__, (ident)); \ 1072d1661a5SPawel Jakub Dawidek msleep((ident), (mtx), (priority), (wmesg), (timeout)); \ 1082d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Woken up %p.", __func__, (ident)); \ 1092d1661a5SPawel Jakub Dawidek } while (0) 1102d1661a5SPawel Jakub Dawidek 1112d1661a5SPawel Jakub Dawidek 1122d1661a5SPawel Jakub Dawidek static int g_raid3_destroy_geom(struct gctl_req *req, struct g_class *mp, 1132d1661a5SPawel Jakub Dawidek struct g_geom *gp); 1142d1661a5SPawel Jakub Dawidek static g_taste_t g_raid3_taste; 1152d1661a5SPawel Jakub Dawidek 1162d1661a5SPawel Jakub Dawidek struct g_class g_raid3_class = { 1172d1661a5SPawel Jakub Dawidek .name = G_RAID3_CLASS_NAME, 1182d1661a5SPawel Jakub Dawidek .version = G_VERSION, 1192d1661a5SPawel Jakub Dawidek .ctlreq = g_raid3_config, 1202d1661a5SPawel Jakub Dawidek .taste = g_raid3_taste, 1212d1661a5SPawel Jakub Dawidek .destroy_geom = g_raid3_destroy_geom 1222d1661a5SPawel Jakub Dawidek }; 1232d1661a5SPawel Jakub Dawidek 1242d1661a5SPawel Jakub Dawidek 1252d1661a5SPawel Jakub Dawidek static void g_raid3_destroy_provider(struct g_raid3_softc *sc); 1262d1661a5SPawel Jakub Dawidek static int g_raid3_update_disk(struct g_raid3_disk *disk, u_int state); 1272d1661a5SPawel Jakub Dawidek static void g_raid3_update_device(struct g_raid3_softc *sc, boolean_t force); 1282d1661a5SPawel Jakub Dawidek static void g_raid3_dumpconf(struct sbuf *sb, const char *indent, 1292d1661a5SPawel Jakub Dawidek struct g_geom *gp, struct g_consumer *cp, struct g_provider *pp); 1302d1661a5SPawel Jakub Dawidek static void g_raid3_sync_stop(struct g_raid3_softc *sc, int type); 1312d1661a5SPawel Jakub Dawidek 1322d1661a5SPawel Jakub Dawidek 1332d1661a5SPawel Jakub Dawidek /* 1342d1661a5SPawel Jakub Dawidek * XXX: it should be placed in subr_disk.c. 1352d1661a5SPawel Jakub Dawidek */ 1362d1661a5SPawel Jakub Dawidek static void 1372d1661a5SPawel Jakub Dawidek bioq_insert_head(struct bio_queue_head *head, struct bio *bp) 1382d1661a5SPawel Jakub Dawidek { 1392d1661a5SPawel Jakub Dawidek 1402d1661a5SPawel Jakub Dawidek TAILQ_INSERT_HEAD(&head->queue, bp, bio_queue); 1412d1661a5SPawel Jakub Dawidek } 1422d1661a5SPawel Jakub Dawidek 1432d1661a5SPawel Jakub Dawidek static const char * 1442d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(int state) 1452d1661a5SPawel Jakub Dawidek { 1462d1661a5SPawel Jakub Dawidek 1472d1661a5SPawel Jakub Dawidek switch (state) { 1482d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_NODISK: 1492d1661a5SPawel Jakub Dawidek return ("NODISK"); 1502d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_NONE: 1512d1661a5SPawel Jakub Dawidek return ("NONE"); 1522d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_NEW: 1532d1661a5SPawel Jakub Dawidek return ("NEW"); 1542d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_ACTIVE: 1552d1661a5SPawel Jakub Dawidek return ("ACTIVE"); 1562d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_STALE: 1572d1661a5SPawel Jakub Dawidek return ("STALE"); 1582d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_SYNCHRONIZING: 1592d1661a5SPawel Jakub Dawidek return ("SYNCHRONIZING"); 1602d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_DISCONNECTED: 1612d1661a5SPawel Jakub Dawidek return ("DISCONNECTED"); 1622d1661a5SPawel Jakub Dawidek default: 1632d1661a5SPawel Jakub Dawidek return ("INVALID"); 1642d1661a5SPawel Jakub Dawidek } 1652d1661a5SPawel Jakub Dawidek } 1662d1661a5SPawel Jakub Dawidek 1672d1661a5SPawel Jakub Dawidek static const char * 1682d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(int state) 1692d1661a5SPawel Jakub Dawidek { 1702d1661a5SPawel Jakub Dawidek 1712d1661a5SPawel Jakub Dawidek switch (state) { 1722d1661a5SPawel Jakub Dawidek case G_RAID3_DEVICE_STATE_STARTING: 1732d1661a5SPawel Jakub Dawidek return ("STARTING"); 1742d1661a5SPawel Jakub Dawidek case G_RAID3_DEVICE_STATE_DEGRADED: 1752d1661a5SPawel Jakub Dawidek return ("DEGRADED"); 1762d1661a5SPawel Jakub Dawidek case G_RAID3_DEVICE_STATE_COMPLETE: 1772d1661a5SPawel Jakub Dawidek return ("COMPLETE"); 1782d1661a5SPawel Jakub Dawidek default: 1792d1661a5SPawel Jakub Dawidek return ("INVALID"); 1802d1661a5SPawel Jakub Dawidek } 1812d1661a5SPawel Jakub Dawidek } 1822d1661a5SPawel Jakub Dawidek 1832d1661a5SPawel Jakub Dawidek const char * 1842d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(struct g_raid3_disk *disk) 1852d1661a5SPawel Jakub Dawidek { 1862d1661a5SPawel Jakub Dawidek 1872d1661a5SPawel Jakub Dawidek if (disk->d_consumer == NULL || disk->d_consumer->provider == NULL) 1882d1661a5SPawel Jakub Dawidek return ("[unknown]"); 1892d1661a5SPawel Jakub Dawidek return (disk->d_name); 1902d1661a5SPawel Jakub Dawidek } 1912d1661a5SPawel Jakub Dawidek 1922d1661a5SPawel Jakub Dawidek #define g_raid3_xor(src1, src2, dst, size) \ 1932d1661a5SPawel Jakub Dawidek _g_raid3_xor((uint64_t *)(src1), (uint64_t *)(src2), \ 1942d1661a5SPawel Jakub Dawidek (uint64_t *)(dst), (size_t)size) 1952d1661a5SPawel Jakub Dawidek static void 1962d1661a5SPawel Jakub Dawidek _g_raid3_xor(uint64_t *src1, uint64_t *src2, uint64_t *dst, size_t size) 1972d1661a5SPawel Jakub Dawidek { 1982d1661a5SPawel Jakub Dawidek 1992d1661a5SPawel Jakub Dawidek KASSERT((size % 128) == 0, ("Invalid size: %zu.", size)); 2002d1661a5SPawel Jakub Dawidek for (; size > 0; size -= 128) { 2012d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2022d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2032d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2042d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2052d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2062d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2072d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2082d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2092d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2102d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2112d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2122d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2132d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2142d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2152d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2162d1661a5SPawel Jakub Dawidek *dst++ = (*src1++) ^ (*src2++); 2172d1661a5SPawel Jakub Dawidek } 2182d1661a5SPawel Jakub Dawidek } 2192d1661a5SPawel Jakub Dawidek 220dba915cfSPawel Jakub Dawidek static int 221dba915cfSPawel Jakub Dawidek g_raid3_is_zero(struct bio *bp) 222dba915cfSPawel Jakub Dawidek { 223dba915cfSPawel Jakub Dawidek static const uint64_t zeros[] = { 224dba915cfSPawel Jakub Dawidek 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 225dba915cfSPawel Jakub Dawidek }; 226dba915cfSPawel Jakub Dawidek u_char *addr; 227dba915cfSPawel Jakub Dawidek ssize_t size; 228dba915cfSPawel Jakub Dawidek 229dba915cfSPawel Jakub Dawidek size = bp->bio_length; 230dba915cfSPawel Jakub Dawidek addr = (u_char *)bp->bio_data; 231dba915cfSPawel Jakub Dawidek for (; size > 0; size -= sizeof(zeros), addr += sizeof(zeros)) { 232dba915cfSPawel Jakub Dawidek if (bcmp(addr, zeros, sizeof(zeros)) != 0) 233dba915cfSPawel Jakub Dawidek return (0); 234dba915cfSPawel Jakub Dawidek } 235dba915cfSPawel Jakub Dawidek return (1); 236dba915cfSPawel Jakub Dawidek } 237dba915cfSPawel Jakub Dawidek 2382d1661a5SPawel Jakub Dawidek /* 2392d1661a5SPawel Jakub Dawidek * --- Events handling functions --- 2402d1661a5SPawel Jakub Dawidek * Events in geom_raid3 are used to maintain disks and device status 2412d1661a5SPawel Jakub Dawidek * from one thread to simplify locking. 2422d1661a5SPawel Jakub Dawidek */ 2432d1661a5SPawel Jakub Dawidek static void 2442d1661a5SPawel Jakub Dawidek g_raid3_event_free(struct g_raid3_event *ep) 2452d1661a5SPawel Jakub Dawidek { 2462d1661a5SPawel Jakub Dawidek 2472d1661a5SPawel Jakub Dawidek free(ep, M_RAID3); 2482d1661a5SPawel Jakub Dawidek } 2492d1661a5SPawel Jakub Dawidek 2502d1661a5SPawel Jakub Dawidek int 2512d1661a5SPawel Jakub Dawidek g_raid3_event_send(void *arg, int state, int flags) 2522d1661a5SPawel Jakub Dawidek { 2532d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 2542d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 2552d1661a5SPawel Jakub Dawidek struct g_raid3_event *ep; 2562d1661a5SPawel Jakub Dawidek int error; 2572d1661a5SPawel Jakub Dawidek 2582d1661a5SPawel Jakub Dawidek ep = malloc(sizeof(*ep), M_RAID3, M_WAITOK); 2592d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Sending event %p.", __func__, ep); 2602d1661a5SPawel Jakub Dawidek if ((flags & G_RAID3_EVENT_DEVICE) != 0) { 2612d1661a5SPawel Jakub Dawidek disk = NULL; 2622d1661a5SPawel Jakub Dawidek sc = arg; 2632d1661a5SPawel Jakub Dawidek } else { 2642d1661a5SPawel Jakub Dawidek disk = arg; 2652d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 2662d1661a5SPawel Jakub Dawidek } 2672d1661a5SPawel Jakub Dawidek ep->e_disk = disk; 2682d1661a5SPawel Jakub Dawidek ep->e_state = state; 2692d1661a5SPawel Jakub Dawidek ep->e_flags = flags; 2702d1661a5SPawel Jakub Dawidek ep->e_error = 0; 2712d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 2722d1661a5SPawel Jakub Dawidek TAILQ_INSERT_TAIL(&sc->sc_events, ep, e_next); 2732d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_events_mtx); 2742d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, sc); 2752d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 2762d1661a5SPawel Jakub Dawidek wakeup(sc); 2772d1661a5SPawel Jakub Dawidek wakeup(&sc->sc_queue); 2782d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 2792d1661a5SPawel Jakub Dawidek if ((flags & G_RAID3_EVENT_DONTWAIT) != 0) 2802d1661a5SPawel Jakub Dawidek return (0); 2812d1661a5SPawel Jakub Dawidek g_topology_assert(); 2822d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Sleeping %p.", __func__, ep); 2832d1661a5SPawel Jakub Dawidek g_topology_unlock(); 2842d1661a5SPawel Jakub Dawidek while ((ep->e_flags & G_RAID3_EVENT_DONE) == 0) { 2852d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 2862d1661a5SPawel Jakub Dawidek MSLEEP(ep, &sc->sc_events_mtx, PRIBIO | PDROP, "r3:event", 2872d1661a5SPawel Jakub Dawidek hz * 5); 2882d1661a5SPawel Jakub Dawidek } 2892d1661a5SPawel Jakub Dawidek /* Don't even try to use 'sc' here, because it could be already dead. */ 2902d1661a5SPawel Jakub Dawidek g_topology_lock(); 2912d1661a5SPawel Jakub Dawidek error = ep->e_error; 2922d1661a5SPawel Jakub Dawidek g_raid3_event_free(ep); 2932d1661a5SPawel Jakub Dawidek return (error); 2942d1661a5SPawel Jakub Dawidek } 2952d1661a5SPawel Jakub Dawidek 2962d1661a5SPawel Jakub Dawidek static struct g_raid3_event * 2972d1661a5SPawel Jakub Dawidek g_raid3_event_get(struct g_raid3_softc *sc) 2982d1661a5SPawel Jakub Dawidek { 2992d1661a5SPawel Jakub Dawidek struct g_raid3_event *ep; 3002d1661a5SPawel Jakub Dawidek 3012d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 3022d1661a5SPawel Jakub Dawidek ep = TAILQ_FIRST(&sc->sc_events); 3032d1661a5SPawel Jakub Dawidek if (ep != NULL) 3042d1661a5SPawel Jakub Dawidek TAILQ_REMOVE(&sc->sc_events, ep, e_next); 3052d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_events_mtx); 3062d1661a5SPawel Jakub Dawidek return (ep); 3072d1661a5SPawel Jakub Dawidek } 3082d1661a5SPawel Jakub Dawidek 3092d1661a5SPawel Jakub Dawidek static void 3102d1661a5SPawel Jakub Dawidek g_raid3_event_cancel(struct g_raid3_disk *disk) 3112d1661a5SPawel Jakub Dawidek { 3122d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 3132d1661a5SPawel Jakub Dawidek struct g_raid3_event *ep, *tmpep; 3142d1661a5SPawel Jakub Dawidek 3152d1661a5SPawel Jakub Dawidek g_topology_assert(); 3162d1661a5SPawel Jakub Dawidek 3172d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 3182d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 3192d1661a5SPawel Jakub Dawidek TAILQ_FOREACH_SAFE(ep, &sc->sc_events, e_next, tmpep) { 3202d1661a5SPawel Jakub Dawidek if ((ep->e_flags & G_RAID3_EVENT_DEVICE) != 0) 3212d1661a5SPawel Jakub Dawidek continue; 3222d1661a5SPawel Jakub Dawidek if (ep->e_disk != disk) 3232d1661a5SPawel Jakub Dawidek continue; 3242d1661a5SPawel Jakub Dawidek TAILQ_REMOVE(&sc->sc_events, ep, e_next); 3252d1661a5SPawel Jakub Dawidek if ((ep->e_flags & G_RAID3_EVENT_DONTWAIT) != 0) 3262d1661a5SPawel Jakub Dawidek g_raid3_event_free(ep); 3272d1661a5SPawel Jakub Dawidek else { 3282d1661a5SPawel Jakub Dawidek ep->e_error = ECANCELED; 3292d1661a5SPawel Jakub Dawidek wakeup(ep); 3302d1661a5SPawel Jakub Dawidek } 3312d1661a5SPawel Jakub Dawidek } 3322d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_events_mtx); 3332d1661a5SPawel Jakub Dawidek } 3342d1661a5SPawel Jakub Dawidek 3352d1661a5SPawel Jakub Dawidek /* 3362d1661a5SPawel Jakub Dawidek * Return the number of disks in the given state. 3372d1661a5SPawel Jakub Dawidek * If state is equal to -1, count all connected disks. 3382d1661a5SPawel Jakub Dawidek */ 3392d1661a5SPawel Jakub Dawidek u_int 3402d1661a5SPawel Jakub Dawidek g_raid3_ndisks(struct g_raid3_softc *sc, int state) 3412d1661a5SPawel Jakub Dawidek { 3422d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 343fa6a7837SDavid E. O'Brien u_int n, ndisks; 3442d1661a5SPawel Jakub Dawidek 345fa6a7837SDavid E. O'Brien for (n = ndisks = 0; n < sc->sc_ndisks; n++) { 3462d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 3472d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NODISK) 3482d1661a5SPawel Jakub Dawidek continue; 3492d1661a5SPawel Jakub Dawidek if (state == -1 || disk->d_state == state) 3502d1661a5SPawel Jakub Dawidek ndisks++; 3512d1661a5SPawel Jakub Dawidek } 3522d1661a5SPawel Jakub Dawidek return (ndisks); 3532d1661a5SPawel Jakub Dawidek } 3542d1661a5SPawel Jakub Dawidek 3552d1661a5SPawel Jakub Dawidek static u_int 3562d1661a5SPawel Jakub Dawidek g_raid3_nrequests(struct g_raid3_softc *sc, struct g_consumer *cp) 3572d1661a5SPawel Jakub Dawidek { 3582d1661a5SPawel Jakub Dawidek struct bio *bp; 3592d1661a5SPawel Jakub Dawidek u_int nreqs = 0; 3602d1661a5SPawel Jakub Dawidek 3612d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 3622d1661a5SPawel Jakub Dawidek TAILQ_FOREACH(bp, &sc->sc_queue.queue, bio_queue) { 3632d1661a5SPawel Jakub Dawidek if (bp->bio_from == cp) 3642d1661a5SPawel Jakub Dawidek nreqs++; 3652d1661a5SPawel Jakub Dawidek } 3662d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 3672d1661a5SPawel Jakub Dawidek return (nreqs); 3682d1661a5SPawel Jakub Dawidek } 3692d1661a5SPawel Jakub Dawidek 3702d1661a5SPawel Jakub Dawidek static int 3712d1661a5SPawel Jakub Dawidek g_raid3_is_busy(struct g_raid3_softc *sc, struct g_consumer *cp) 3722d1661a5SPawel Jakub Dawidek { 3732d1661a5SPawel Jakub Dawidek 3742d1661a5SPawel Jakub Dawidek if (cp->nstart != cp->nend) { 3752d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, 3762d1661a5SPawel Jakub Dawidek "I/O requests for %s exist, can't destroy it now.", 3772d1661a5SPawel Jakub Dawidek cp->provider->name); 3782d1661a5SPawel Jakub Dawidek return (1); 3792d1661a5SPawel Jakub Dawidek } 3802d1661a5SPawel Jakub Dawidek if (g_raid3_nrequests(sc, cp) > 0) { 3812d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, 3822d1661a5SPawel Jakub Dawidek "I/O requests for %s in queue, can't destroy it now.", 3832d1661a5SPawel Jakub Dawidek cp->provider->name); 3842d1661a5SPawel Jakub Dawidek return (1); 3852d1661a5SPawel Jakub Dawidek } 3862d1661a5SPawel Jakub Dawidek return (0); 3872d1661a5SPawel Jakub Dawidek } 3882d1661a5SPawel Jakub Dawidek 3892d1661a5SPawel Jakub Dawidek static void 3902d1661a5SPawel Jakub Dawidek g_raid3_kill_consumer(struct g_raid3_softc *sc, struct g_consumer *cp) 3912d1661a5SPawel Jakub Dawidek { 3922d1661a5SPawel Jakub Dawidek 3932d1661a5SPawel Jakub Dawidek g_topology_assert(); 3942d1661a5SPawel Jakub Dawidek 3952d1661a5SPawel Jakub Dawidek cp->private = NULL; 3962d1661a5SPawel Jakub Dawidek if (g_raid3_is_busy(sc, cp)) 3972d1661a5SPawel Jakub Dawidek return; 3982d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Consumer %s destroyed.", cp->provider->name); 3992d1661a5SPawel Jakub Dawidek g_detach(cp); 4002d1661a5SPawel Jakub Dawidek g_destroy_consumer(cp); 4012d1661a5SPawel Jakub Dawidek } 4022d1661a5SPawel Jakub Dawidek 4032d1661a5SPawel Jakub Dawidek static int 4042d1661a5SPawel Jakub Dawidek g_raid3_connect_disk(struct g_raid3_disk *disk, struct g_provider *pp) 4052d1661a5SPawel Jakub Dawidek { 4062d1661a5SPawel Jakub Dawidek int error; 4072d1661a5SPawel Jakub Dawidek 4082d1661a5SPawel Jakub Dawidek g_topology_assert(); 4092d1661a5SPawel Jakub Dawidek KASSERT(disk->d_consumer == NULL, 4102d1661a5SPawel Jakub Dawidek ("Disk already connected (device %s).", disk->d_softc->sc_name)); 4112d1661a5SPawel Jakub Dawidek 4122d1661a5SPawel Jakub Dawidek disk->d_consumer = g_new_consumer(disk->d_softc->sc_geom); 4132d1661a5SPawel Jakub Dawidek disk->d_consumer->private = disk; 4142d1661a5SPawel Jakub Dawidek error = g_attach(disk->d_consumer, pp); 4152d1661a5SPawel Jakub Dawidek if (error != 0) 4162d1661a5SPawel Jakub Dawidek return (error); 4172d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Disk %s connected.", g_raid3_get_diskname(disk)); 4182d1661a5SPawel Jakub Dawidek return (0); 4192d1661a5SPawel Jakub Dawidek } 4202d1661a5SPawel Jakub Dawidek 4212d1661a5SPawel Jakub Dawidek static void 4222d1661a5SPawel Jakub Dawidek g_raid3_disconnect_consumer(struct g_raid3_softc *sc, struct g_consumer *cp) 4232d1661a5SPawel Jakub Dawidek { 4242d1661a5SPawel Jakub Dawidek 4252d1661a5SPawel Jakub Dawidek g_topology_assert(); 4262d1661a5SPawel Jakub Dawidek 4272d1661a5SPawel Jakub Dawidek if (cp == NULL) 4282d1661a5SPawel Jakub Dawidek return; 4292d1661a5SPawel Jakub Dawidek if (cp->provider != NULL) { 4302d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Disk %s disconnected.", cp->provider->name); 4312d1661a5SPawel Jakub Dawidek if (cp->acr > 0 || cp->acw > 0 || cp->ace > 0) { 4322d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Access %s r%dw%de%d = %d", 4332d1661a5SPawel Jakub Dawidek cp->provider->name, -cp->acr, -cp->acw, -cp->ace, 4342d1661a5SPawel Jakub Dawidek 0); 4352d1661a5SPawel Jakub Dawidek g_access(cp, -cp->acr, -cp->acw, -cp->ace); 4362d1661a5SPawel Jakub Dawidek } 4372d1661a5SPawel Jakub Dawidek g_raid3_kill_consumer(sc, cp); 4382d1661a5SPawel Jakub Dawidek } else { 4392d1661a5SPawel Jakub Dawidek g_destroy_consumer(cp); 4402d1661a5SPawel Jakub Dawidek } 4412d1661a5SPawel Jakub Dawidek } 4422d1661a5SPawel Jakub Dawidek 4432d1661a5SPawel Jakub Dawidek /* 4442d1661a5SPawel Jakub Dawidek * Initialize disk. This means allocate memory, create consumer, attach it 4452d1661a5SPawel Jakub Dawidek * to the provider and open access (r1w1e1) to it. 4462d1661a5SPawel Jakub Dawidek */ 4472d1661a5SPawel Jakub Dawidek static struct g_raid3_disk * 4482d1661a5SPawel Jakub Dawidek g_raid3_init_disk(struct g_raid3_softc *sc, struct g_provider *pp, 4492d1661a5SPawel Jakub Dawidek struct g_raid3_metadata *md, int *errorp) 4502d1661a5SPawel Jakub Dawidek { 4512d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 4522d1661a5SPawel Jakub Dawidek int error; 4532d1661a5SPawel Jakub Dawidek 4542d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[md->md_no]; 4552d1661a5SPawel Jakub Dawidek disk->d_softc = sc; 4562d1661a5SPawel Jakub Dawidek error = g_raid3_connect_disk(disk, pp); 4572d1661a5SPawel Jakub Dawidek if (error != 0) 4582d1661a5SPawel Jakub Dawidek goto fail; 4592d1661a5SPawel Jakub Dawidek disk->d_no = md->md_no; 4602d1661a5SPawel Jakub Dawidek disk->d_state = G_RAID3_DISK_STATE_NONE; 4612d1661a5SPawel Jakub Dawidek disk->d_flags = md->md_dflags; 4622d1661a5SPawel Jakub Dawidek if (md->md_provider[0] != '\0') 4632d1661a5SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_HARDCODED; 4642d1661a5SPawel Jakub Dawidek disk->d_sync.ds_consumer = NULL; 4652d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset = md->md_sync_offset; 4662d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset_done = md->md_sync_offset; 4672d1661a5SPawel Jakub Dawidek disk->d_sync.ds_syncid = md->md_syncid; 4682d1661a5SPawel Jakub Dawidek if (errorp != NULL) 4692d1661a5SPawel Jakub Dawidek *errorp = 0; 4702d1661a5SPawel Jakub Dawidek return (disk); 4712d1661a5SPawel Jakub Dawidek fail: 4722d1661a5SPawel Jakub Dawidek if (errorp != NULL) 4732d1661a5SPawel Jakub Dawidek *errorp = error; 4742d1661a5SPawel Jakub Dawidek if (disk != NULL) 4752d1661a5SPawel Jakub Dawidek g_raid3_disconnect_consumer(sc, disk->d_consumer); 4762d1661a5SPawel Jakub Dawidek return (NULL); 4772d1661a5SPawel Jakub Dawidek } 4782d1661a5SPawel Jakub Dawidek 4792d1661a5SPawel Jakub Dawidek static void 4802d1661a5SPawel Jakub Dawidek g_raid3_destroy_disk(struct g_raid3_disk *disk) 4812d1661a5SPawel Jakub Dawidek { 4822d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 4832d1661a5SPawel Jakub Dawidek 4842d1661a5SPawel Jakub Dawidek g_topology_assert(); 4852d1661a5SPawel Jakub Dawidek 4862d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NODISK) 4872d1661a5SPawel Jakub Dawidek return; 4882d1661a5SPawel Jakub Dawidek g_raid3_event_cancel(disk); 4892d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 4902d1661a5SPawel Jakub Dawidek switch (disk->d_state) { 4912d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_SYNCHRONIZING: 4922d1661a5SPawel Jakub Dawidek if (sc->sc_syncdisk != NULL) 4932d1661a5SPawel Jakub Dawidek g_raid3_sync_stop(sc, 1); 4942d1661a5SPawel Jakub Dawidek /* FALLTHROUGH */ 4952d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_NEW: 4962d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_STALE: 4972d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_ACTIVE: 4982d1661a5SPawel Jakub Dawidek g_raid3_disconnect_consumer(sc, disk->d_consumer); 4992d1661a5SPawel Jakub Dawidek disk->d_consumer = NULL; 5002d1661a5SPawel Jakub Dawidek break; 5012d1661a5SPawel Jakub Dawidek default: 5022d1661a5SPawel Jakub Dawidek KASSERT(0 == 1, ("Wrong disk state (%s, %s).", 5032d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 5042d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 5052d1661a5SPawel Jakub Dawidek } 5062d1661a5SPawel Jakub Dawidek disk->d_state = G_RAID3_DISK_STATE_NODISK; 5072d1661a5SPawel Jakub Dawidek } 5082d1661a5SPawel Jakub Dawidek 5092d1661a5SPawel Jakub Dawidek static void 5102d1661a5SPawel Jakub Dawidek g_raid3_destroy_device(struct g_raid3_softc *sc) 5112d1661a5SPawel Jakub Dawidek { 5122d1661a5SPawel Jakub Dawidek struct g_raid3_event *ep; 5132d1661a5SPawel Jakub Dawidek struct g_geom *gp; 5142d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 5152d1661a5SPawel Jakub Dawidek u_int n; 5162d1661a5SPawel Jakub Dawidek 5172d1661a5SPawel Jakub Dawidek g_topology_assert(); 5182d1661a5SPawel Jakub Dawidek 5192d1661a5SPawel Jakub Dawidek gp = sc->sc_geom; 5202d1661a5SPawel Jakub Dawidek if (sc->sc_provider != NULL) 5212d1661a5SPawel Jakub Dawidek g_raid3_destroy_provider(sc); 5222d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) 5232d1661a5SPawel Jakub Dawidek g_raid3_destroy_disk(&sc->sc_disks[n]); 5242d1661a5SPawel Jakub Dawidek while ((ep = g_raid3_event_get(sc)) != NULL) { 5252d1661a5SPawel Jakub Dawidek if ((ep->e_flags & G_RAID3_EVENT_DONTWAIT) != 0) 5262d1661a5SPawel Jakub Dawidek g_raid3_event_free(ep); 5272d1661a5SPawel Jakub Dawidek else { 5282d1661a5SPawel Jakub Dawidek ep->e_error = ECANCELED; 5292d1661a5SPawel Jakub Dawidek ep->e_flags |= G_RAID3_EVENT_DONE; 5302d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, ep); 5312d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 5322d1661a5SPawel Jakub Dawidek wakeup(ep); 5332d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_events_mtx); 5342d1661a5SPawel Jakub Dawidek } 5352d1661a5SPawel Jakub Dawidek } 5362d1661a5SPawel Jakub Dawidek callout_drain(&sc->sc_callout); 5372d1661a5SPawel Jakub Dawidek gp->softc = NULL; 5382d1661a5SPawel Jakub Dawidek cp = LIST_FIRST(&sc->sc_sync.ds_geom->consumer); 5392d1661a5SPawel Jakub Dawidek if (cp != NULL) 5402d1661a5SPawel Jakub Dawidek g_raid3_disconnect_consumer(sc, cp); 5412d1661a5SPawel Jakub Dawidek sc->sc_sync.ds_geom->softc = NULL; 5422d1661a5SPawel Jakub Dawidek g_wither_geom(sc->sc_sync.ds_geom, ENXIO); 5432d1661a5SPawel Jakub Dawidek uma_zdestroy(sc->sc_zone_64k); 5442d1661a5SPawel Jakub Dawidek uma_zdestroy(sc->sc_zone_16k); 5452d1661a5SPawel Jakub Dawidek uma_zdestroy(sc->sc_zone_4k); 5462d1661a5SPawel Jakub Dawidek mtx_destroy(&sc->sc_queue_mtx); 5472d1661a5SPawel Jakub Dawidek mtx_destroy(&sc->sc_events_mtx); 5482d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s destroyed.", gp->name); 5492d1661a5SPawel Jakub Dawidek g_wither_geom(gp, ENXIO); 5502d1661a5SPawel Jakub Dawidek } 5512d1661a5SPawel Jakub Dawidek 5522d1661a5SPawel Jakub Dawidek static void 5532d1661a5SPawel Jakub Dawidek g_raid3_orphan(struct g_consumer *cp) 5542d1661a5SPawel Jakub Dawidek { 5552d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 5562d1661a5SPawel Jakub Dawidek 5572d1661a5SPawel Jakub Dawidek g_topology_assert(); 5582d1661a5SPawel Jakub Dawidek 5592d1661a5SPawel Jakub Dawidek disk = cp->private; 5602d1661a5SPawel Jakub Dawidek if (disk == NULL) 5612d1661a5SPawel Jakub Dawidek return; 5622d1661a5SPawel Jakub Dawidek disk->d_softc->sc_bump_syncid = G_RAID3_BUMP_ON_FIRST_WRITE; 5632d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, G_RAID3_DISK_STATE_DISCONNECTED, 5642d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 5652d1661a5SPawel Jakub Dawidek } 5662d1661a5SPawel Jakub Dawidek 5672d1661a5SPawel Jakub Dawidek static void 5682d1661a5SPawel Jakub Dawidek g_raid3_spoiled(struct g_consumer *cp) 5692d1661a5SPawel Jakub Dawidek { 5702d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 5712d1661a5SPawel Jakub Dawidek 5722d1661a5SPawel Jakub Dawidek g_topology_assert(); 5732d1661a5SPawel Jakub Dawidek 5742d1661a5SPawel Jakub Dawidek disk = cp->private; 5752d1661a5SPawel Jakub Dawidek if (disk == NULL) 5762d1661a5SPawel Jakub Dawidek return; 5772d1661a5SPawel Jakub Dawidek disk->d_softc->sc_bump_syncid = G_RAID3_BUMP_IMMEDIATELY; 5782d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, G_RAID3_DISK_STATE_DISCONNECTED, 5792d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 5802d1661a5SPawel Jakub Dawidek } 5812d1661a5SPawel Jakub Dawidek 5822d1661a5SPawel Jakub Dawidek static int 5832d1661a5SPawel Jakub Dawidek g_raid3_write_metadata(struct g_raid3_disk *disk, struct g_raid3_metadata *md) 5842d1661a5SPawel Jakub Dawidek { 5852d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 5862d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 5872d1661a5SPawel Jakub Dawidek off_t offset, length; 5882d1661a5SPawel Jakub Dawidek int close = 0, error = 0; 5892d1661a5SPawel Jakub Dawidek u_char *sector; 5902d1661a5SPawel Jakub Dawidek 5912d1661a5SPawel Jakub Dawidek g_topology_assert(); 5922d1661a5SPawel Jakub Dawidek 5932d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 5942d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 5952d1661a5SPawel Jakub Dawidek KASSERT(cp != NULL, ("NULL consumer (%s).", sc->sc_name)); 5962d1661a5SPawel Jakub Dawidek KASSERT(cp->provider != NULL, ("NULL provider (%s).", sc->sc_name)); 5972d1661a5SPawel Jakub Dawidek length = cp->provider->sectorsize; 5982d1661a5SPawel Jakub Dawidek offset = cp->provider->mediasize - length; 5992d1661a5SPawel Jakub Dawidek sector = malloc((size_t)length, M_RAID3, M_WAITOK | M_ZERO); 6002d1661a5SPawel Jakub Dawidek /* 6012d1661a5SPawel Jakub Dawidek * Open consumer if it wasn't opened and remember to close it. 6022d1661a5SPawel Jakub Dawidek */ 6032d1661a5SPawel Jakub Dawidek if ((disk->d_flags & G_RAID3_DISK_FLAG_DIRTY) == 0) { 6042d1661a5SPawel Jakub Dawidek error = g_access(cp, 0, 1, 1); 6052d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Access %s r%dw%de%d = %d", cp->provider->name, 6062d1661a5SPawel Jakub Dawidek 0, 1, 1, error); 6072d1661a5SPawel Jakub Dawidek if (error == 0) 6082d1661a5SPawel Jakub Dawidek close = 1; 6092d1661a5SPawel Jakub Dawidek #ifdef INVARIANTS 6102d1661a5SPawel Jakub Dawidek } else { 6112d1661a5SPawel Jakub Dawidek KASSERT(cp->acw > 0 && cp->ace > 0, 6122d1661a5SPawel Jakub Dawidek ("Consumer %s not opened (r%dw%de%d).", cp->provider->name, 6132d1661a5SPawel Jakub Dawidek cp->acr, cp->acw, cp->ace)); 6142d1661a5SPawel Jakub Dawidek #endif 6152d1661a5SPawel Jakub Dawidek } 6162d1661a5SPawel Jakub Dawidek if (error == 0) { 6172d1661a5SPawel Jakub Dawidek if (md != NULL) 6182d1661a5SPawel Jakub Dawidek raid3_metadata_encode(md, sector); 6192d1661a5SPawel Jakub Dawidek g_topology_unlock(); 6202d1661a5SPawel Jakub Dawidek error = g_write_data(cp, offset, sector, length); 6212d1661a5SPawel Jakub Dawidek g_topology_lock(); 6222d1661a5SPawel Jakub Dawidek } 6232d1661a5SPawel Jakub Dawidek free(sector, M_RAID3); 6242d1661a5SPawel Jakub Dawidek if (close) { 6252d1661a5SPawel Jakub Dawidek g_access(cp, 0, -1, -1); 6262d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Access %s r%dw%de%d = %d", 6272d1661a5SPawel Jakub Dawidek cp->provider->name, 0, -1, -1, 0); 6282d1661a5SPawel Jakub Dawidek } 6292d1661a5SPawel Jakub Dawidek if (error != 0) { 6302d1661a5SPawel Jakub Dawidek disk->d_softc->sc_bump_syncid = G_RAID3_BUMP_IMMEDIATELY; 6312d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, G_RAID3_DISK_STATE_DISCONNECTED, 6322d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 6332d1661a5SPawel Jakub Dawidek } 6342d1661a5SPawel Jakub Dawidek return (error); 6352d1661a5SPawel Jakub Dawidek } 6362d1661a5SPawel Jakub Dawidek 6372d1661a5SPawel Jakub Dawidek int 6382d1661a5SPawel Jakub Dawidek g_raid3_clear_metadata(struct g_raid3_disk *disk) 6392d1661a5SPawel Jakub Dawidek { 6402d1661a5SPawel Jakub Dawidek int error; 6412d1661a5SPawel Jakub Dawidek 6422d1661a5SPawel Jakub Dawidek g_topology_assert(); 6432d1661a5SPawel Jakub Dawidek error = g_raid3_write_metadata(disk, NULL); 6442d1661a5SPawel Jakub Dawidek if (error == 0) { 6452d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Metadata on %s cleared.", 6462d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk)); 6472d1661a5SPawel Jakub Dawidek } else { 6482d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, 6492d1661a5SPawel Jakub Dawidek "Cannot clear metadata on disk %s (error=%d).", 6502d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), error); 6512d1661a5SPawel Jakub Dawidek } 6522d1661a5SPawel Jakub Dawidek return (error); 6532d1661a5SPawel Jakub Dawidek } 6542d1661a5SPawel Jakub Dawidek 6552d1661a5SPawel Jakub Dawidek void 6562d1661a5SPawel Jakub Dawidek g_raid3_fill_metadata(struct g_raid3_disk *disk, struct g_raid3_metadata *md) 6572d1661a5SPawel Jakub Dawidek { 6582d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 6592d1661a5SPawel Jakub Dawidek 6602d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 6612d1661a5SPawel Jakub Dawidek strlcpy(md->md_magic, G_RAID3_MAGIC, sizeof(md->md_magic)); 6622d1661a5SPawel Jakub Dawidek md->md_version = G_RAID3_VERSION; 6632d1661a5SPawel Jakub Dawidek strlcpy(md->md_name, sc->sc_name, sizeof(md->md_name)); 6642d1661a5SPawel Jakub Dawidek md->md_id = sc->sc_id; 6652d1661a5SPawel Jakub Dawidek md->md_all = sc->sc_ndisks; 6662d1661a5SPawel Jakub Dawidek md->md_mediasize = sc->sc_mediasize; 6672d1661a5SPawel Jakub Dawidek md->md_sectorsize = sc->sc_sectorsize; 6682d1661a5SPawel Jakub Dawidek md->md_mflags = (sc->sc_flags & G_RAID3_DEVICE_FLAG_MASK); 6692d1661a5SPawel Jakub Dawidek md->md_no = disk->d_no; 6702d1661a5SPawel Jakub Dawidek md->md_syncid = disk->d_sync.ds_syncid; 6712d1661a5SPawel Jakub Dawidek md->md_dflags = (disk->d_flags & G_RAID3_DISK_FLAG_MASK); 6722d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING) 6732d1661a5SPawel Jakub Dawidek md->md_sync_offset = disk->d_sync.ds_offset_done; 6742d1661a5SPawel Jakub Dawidek else 6752d1661a5SPawel Jakub Dawidek md->md_sync_offset = 0; 6762d1661a5SPawel Jakub Dawidek if ((disk->d_flags & G_RAID3_DISK_FLAG_HARDCODED) != 0 && 6772d1661a5SPawel Jakub Dawidek disk->d_consumer != NULL && disk->d_consumer->provider != NULL) { 6782d1661a5SPawel Jakub Dawidek strlcpy(md->md_provider, disk->d_consumer->provider->name, 6792d1661a5SPawel Jakub Dawidek sizeof(md->md_provider)); 6802d1661a5SPawel Jakub Dawidek } else { 6812d1661a5SPawel Jakub Dawidek bzero(md->md_provider, sizeof(md->md_provider)); 6822d1661a5SPawel Jakub Dawidek } 6832d1661a5SPawel Jakub Dawidek } 6842d1661a5SPawel Jakub Dawidek 6852d1661a5SPawel Jakub Dawidek void 6862d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(struct g_raid3_disk *disk) 6872d1661a5SPawel Jakub Dawidek { 6882d1661a5SPawel Jakub Dawidek struct g_raid3_metadata md; 6892d1661a5SPawel Jakub Dawidek int error; 6902d1661a5SPawel Jakub Dawidek 6912d1661a5SPawel Jakub Dawidek g_topology_assert(); 6922d1661a5SPawel Jakub Dawidek g_raid3_fill_metadata(disk, &md); 6932d1661a5SPawel Jakub Dawidek error = g_raid3_write_metadata(disk, &md); 6942d1661a5SPawel Jakub Dawidek if (error == 0) { 6952d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Metadata on %s updated.", 6962d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk)); 6972d1661a5SPawel Jakub Dawidek } else { 6982d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, 6992d1661a5SPawel Jakub Dawidek "Cannot update metadata on disk %s (error=%d).", 7002d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), error); 7012d1661a5SPawel Jakub Dawidek } 7022d1661a5SPawel Jakub Dawidek } 7032d1661a5SPawel Jakub Dawidek 7042d1661a5SPawel Jakub Dawidek static void 7052d1661a5SPawel Jakub Dawidek g_raid3_bump_syncid(struct g_raid3_softc *sc) 7062d1661a5SPawel Jakub Dawidek { 7072d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 7082d1661a5SPawel Jakub Dawidek u_int n; 7092d1661a5SPawel Jakub Dawidek 7102d1661a5SPawel Jakub Dawidek g_topology_assert(); 7112d1661a5SPawel Jakub Dawidek KASSERT(g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) > 0, 7122d1661a5SPawel Jakub Dawidek ("%s called with no active disks (device=%s).", __func__, 7132d1661a5SPawel Jakub Dawidek sc->sc_name)); 7142d1661a5SPawel Jakub Dawidek 7152d1661a5SPawel Jakub Dawidek sc->sc_syncid++; 7162d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 7172d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 7182d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_ACTIVE || 7192d1661a5SPawel Jakub Dawidek disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING) { 7202d1661a5SPawel Jakub Dawidek disk->d_sync.ds_syncid = sc->sc_syncid; 7212d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(disk); 7222d1661a5SPawel Jakub Dawidek } 7232d1661a5SPawel Jakub Dawidek } 7242d1661a5SPawel Jakub Dawidek } 7252d1661a5SPawel Jakub Dawidek 7262d1661a5SPawel Jakub Dawidek /* 7272d1661a5SPawel Jakub Dawidek * Treat bio_driver1 field in parent bio as list head and field bio_caller1 7282d1661a5SPawel Jakub Dawidek * in child bio as pointer to the next element on the list. 7292d1661a5SPawel Jakub Dawidek */ 7302d1661a5SPawel Jakub Dawidek #define G_RAID3_HEAD_BIO(pbp) (pbp)->bio_driver1 7312d1661a5SPawel Jakub Dawidek 7322d1661a5SPawel Jakub Dawidek #define G_RAID3_NEXT_BIO(cbp) (cbp)->bio_caller1 7332d1661a5SPawel Jakub Dawidek 7342d1661a5SPawel Jakub Dawidek #define G_RAID3_FOREACH_BIO(pbp, bp) \ 7352d1661a5SPawel Jakub Dawidek for ((bp) = G_RAID3_HEAD_BIO(pbp); (bp) != NULL; \ 7362d1661a5SPawel Jakub Dawidek (bp) = G_RAID3_NEXT_BIO(bp)) 7372d1661a5SPawel Jakub Dawidek 7382d1661a5SPawel Jakub Dawidek #define G_RAID3_FOREACH_SAFE_BIO(pbp, bp, tmpbp) \ 7392d1661a5SPawel Jakub Dawidek for ((bp) = G_RAID3_HEAD_BIO(pbp); \ 7402d1661a5SPawel Jakub Dawidek (bp) != NULL && ((tmpbp) = G_RAID3_NEXT_BIO(bp), 1); \ 7412d1661a5SPawel Jakub Dawidek (bp) = (tmpbp)) 7422d1661a5SPawel Jakub Dawidek 7432d1661a5SPawel Jakub Dawidek static void 7442d1661a5SPawel Jakub Dawidek g_raid3_init_bio(struct bio *pbp) 7452d1661a5SPawel Jakub Dawidek { 7462d1661a5SPawel Jakub Dawidek 7472d1661a5SPawel Jakub Dawidek G_RAID3_HEAD_BIO(pbp) = NULL; 7482d1661a5SPawel Jakub Dawidek } 7492d1661a5SPawel Jakub Dawidek 7502d1661a5SPawel Jakub Dawidek static void 751dba915cfSPawel Jakub Dawidek g_raid3_remove_bio(struct bio *cbp) 752dba915cfSPawel Jakub Dawidek { 753dba915cfSPawel Jakub Dawidek struct bio *pbp, *bp; 754dba915cfSPawel Jakub Dawidek 755dba915cfSPawel Jakub Dawidek pbp = cbp->bio_parent; 756dba915cfSPawel Jakub Dawidek if (G_RAID3_HEAD_BIO(pbp) == cbp) 757dba915cfSPawel Jakub Dawidek G_RAID3_HEAD_BIO(pbp) = G_RAID3_NEXT_BIO(cbp); 758dba915cfSPawel Jakub Dawidek else { 759dba915cfSPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, bp) { 760dba915cfSPawel Jakub Dawidek if (G_RAID3_NEXT_BIO(bp) == cbp) { 761dba915cfSPawel Jakub Dawidek G_RAID3_NEXT_BIO(bp) = G_RAID3_NEXT_BIO(cbp); 762dba915cfSPawel Jakub Dawidek break; 763dba915cfSPawel Jakub Dawidek } 764dba915cfSPawel Jakub Dawidek } 765dba915cfSPawel Jakub Dawidek } 766dba915cfSPawel Jakub Dawidek G_RAID3_NEXT_BIO(cbp) = NULL; 767dba915cfSPawel Jakub Dawidek } 768dba915cfSPawel Jakub Dawidek 769dba915cfSPawel Jakub Dawidek static void 770dba915cfSPawel Jakub Dawidek g_raid3_replace_bio(struct bio *sbp, struct bio *dbp) 771dba915cfSPawel Jakub Dawidek { 772dba915cfSPawel Jakub Dawidek struct bio *pbp, *bp; 773dba915cfSPawel Jakub Dawidek 774dba915cfSPawel Jakub Dawidek g_raid3_remove_bio(sbp); 775dba915cfSPawel Jakub Dawidek pbp = dbp->bio_parent; 776dba915cfSPawel Jakub Dawidek G_RAID3_NEXT_BIO(sbp) = G_RAID3_NEXT_BIO(dbp); 777dba915cfSPawel Jakub Dawidek if (G_RAID3_HEAD_BIO(pbp) == dbp) 778dba915cfSPawel Jakub Dawidek G_RAID3_HEAD_BIO(pbp) = sbp; 779dba915cfSPawel Jakub Dawidek else { 780dba915cfSPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, bp) { 781dba915cfSPawel Jakub Dawidek if (G_RAID3_NEXT_BIO(bp) == dbp) { 782dba915cfSPawel Jakub Dawidek G_RAID3_NEXT_BIO(bp) = sbp; 783dba915cfSPawel Jakub Dawidek break; 784dba915cfSPawel Jakub Dawidek } 785dba915cfSPawel Jakub Dawidek } 786dba915cfSPawel Jakub Dawidek } 787dba915cfSPawel Jakub Dawidek G_RAID3_NEXT_BIO(dbp) = NULL; 788dba915cfSPawel Jakub Dawidek } 789dba915cfSPawel Jakub Dawidek 790dba915cfSPawel Jakub Dawidek static void 7912d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(struct g_raid3_softc *sc, struct bio *cbp) 7922d1661a5SPawel Jakub Dawidek { 7932d1661a5SPawel Jakub Dawidek struct bio *bp, *pbp; 7942d1661a5SPawel Jakub Dawidek size_t size; 7952d1661a5SPawel Jakub Dawidek 7962d1661a5SPawel Jakub Dawidek pbp = cbp->bio_parent; 7972d1661a5SPawel Jakub Dawidek pbp->bio_children--; 7982d1661a5SPawel Jakub Dawidek KASSERT(cbp->bio_data != NULL, ("NULL bio_data")); 7992d1661a5SPawel Jakub Dawidek size = pbp->bio_length / (sc->sc_ndisks - 1); 8002d1661a5SPawel Jakub Dawidek if (size > 16384) 8012d1661a5SPawel Jakub Dawidek uma_zfree(sc->sc_zone_64k, cbp->bio_data); 8022d1661a5SPawel Jakub Dawidek else if (size > 4096) 8032d1661a5SPawel Jakub Dawidek uma_zfree(sc->sc_zone_16k, cbp->bio_data); 8042d1661a5SPawel Jakub Dawidek else 8052d1661a5SPawel Jakub Dawidek uma_zfree(sc->sc_zone_4k, cbp->bio_data); 8062d1661a5SPawel Jakub Dawidek if (G_RAID3_HEAD_BIO(pbp) == cbp) { 8072d1661a5SPawel Jakub Dawidek G_RAID3_HEAD_BIO(pbp) = G_RAID3_NEXT_BIO(cbp); 8082d1661a5SPawel Jakub Dawidek G_RAID3_NEXT_BIO(cbp) = NULL; 8092d1661a5SPawel Jakub Dawidek g_destroy_bio(cbp); 8102d1661a5SPawel Jakub Dawidek } else { 8112d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, bp) { 8122d1661a5SPawel Jakub Dawidek if (G_RAID3_NEXT_BIO(bp) == cbp) 8132d1661a5SPawel Jakub Dawidek break; 8142d1661a5SPawel Jakub Dawidek } 815dba915cfSPawel Jakub Dawidek if (bp != NULL) { 816dba915cfSPawel Jakub Dawidek KASSERT(G_RAID3_NEXT_BIO(bp) != NULL, 817dba915cfSPawel Jakub Dawidek ("NULL bp->bio_driver1")); 8182d1661a5SPawel Jakub Dawidek G_RAID3_NEXT_BIO(bp) = G_RAID3_NEXT_BIO(cbp); 8192d1661a5SPawel Jakub Dawidek G_RAID3_NEXT_BIO(cbp) = NULL; 820dba915cfSPawel Jakub Dawidek } 8212d1661a5SPawel Jakub Dawidek g_destroy_bio(cbp); 8222d1661a5SPawel Jakub Dawidek } 8232d1661a5SPawel Jakub Dawidek } 8242d1661a5SPawel Jakub Dawidek 8252d1661a5SPawel Jakub Dawidek static struct bio * 8262d1661a5SPawel Jakub Dawidek g_raid3_clone_bio(struct g_raid3_softc *sc, struct bio *pbp) 8272d1661a5SPawel Jakub Dawidek { 8282d1661a5SPawel Jakub Dawidek struct bio *bp, *cbp; 8292d1661a5SPawel Jakub Dawidek size_t size; 8302d1661a5SPawel Jakub Dawidek 8312d1661a5SPawel Jakub Dawidek cbp = g_clone_bio(pbp); 8322d1661a5SPawel Jakub Dawidek if (cbp == NULL) 8332d1661a5SPawel Jakub Dawidek return (NULL); 8342d1661a5SPawel Jakub Dawidek size = pbp->bio_length / (sc->sc_ndisks - 1); 8352d1661a5SPawel Jakub Dawidek if (size > 16384) { 8362d1661a5SPawel Jakub Dawidek cbp->bio_data = uma_zalloc(sc->sc_zone_64k, M_NOWAIT); 8372d1661a5SPawel Jakub Dawidek g_raid3_64k_requested++; 8382d1661a5SPawel Jakub Dawidek } else if (size > 4096) { 8392d1661a5SPawel Jakub Dawidek cbp->bio_data = uma_zalloc(sc->sc_zone_16k, M_NOWAIT); 8402d1661a5SPawel Jakub Dawidek g_raid3_16k_requested++; 8412d1661a5SPawel Jakub Dawidek } else { 8422d1661a5SPawel Jakub Dawidek cbp->bio_data = uma_zalloc(sc->sc_zone_4k, M_NOWAIT); 8432d1661a5SPawel Jakub Dawidek g_raid3_4k_requested++; 8442d1661a5SPawel Jakub Dawidek } 8452d1661a5SPawel Jakub Dawidek if (cbp->bio_data == NULL) { 8462d1661a5SPawel Jakub Dawidek if (size > 16384) 8472d1661a5SPawel Jakub Dawidek g_raid3_64k_failed++; 8482d1661a5SPawel Jakub Dawidek if (size > 4096) 8492d1661a5SPawel Jakub Dawidek g_raid3_16k_failed++; 8502d1661a5SPawel Jakub Dawidek else 8512d1661a5SPawel Jakub Dawidek g_raid3_4k_failed++; 8522d1661a5SPawel Jakub Dawidek pbp->bio_children--; 8532d1661a5SPawel Jakub Dawidek g_destroy_bio(cbp); 8542d1661a5SPawel Jakub Dawidek return (NULL); 8552d1661a5SPawel Jakub Dawidek } 8562d1661a5SPawel Jakub Dawidek G_RAID3_NEXT_BIO(cbp) = NULL; 8572d1661a5SPawel Jakub Dawidek if (G_RAID3_HEAD_BIO(pbp) == NULL) 8582d1661a5SPawel Jakub Dawidek G_RAID3_HEAD_BIO(pbp) = cbp; 8592d1661a5SPawel Jakub Dawidek else { 8602d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, bp) { 8612d1661a5SPawel Jakub Dawidek if (G_RAID3_NEXT_BIO(bp) == NULL) { 8622d1661a5SPawel Jakub Dawidek G_RAID3_NEXT_BIO(bp) = cbp; 8632d1661a5SPawel Jakub Dawidek break; 8642d1661a5SPawel Jakub Dawidek } 8652d1661a5SPawel Jakub Dawidek } 8662d1661a5SPawel Jakub Dawidek } 8672d1661a5SPawel Jakub Dawidek return (cbp); 8682d1661a5SPawel Jakub Dawidek } 8692d1661a5SPawel Jakub Dawidek 8702d1661a5SPawel Jakub Dawidek static void 8712d1661a5SPawel Jakub Dawidek g_raid3_scatter(struct bio *pbp) 8722d1661a5SPawel Jakub Dawidek { 8732d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 8742d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 8752d1661a5SPawel Jakub Dawidek struct bio *bp, *cbp; 8762d1661a5SPawel Jakub Dawidek off_t atom, cadd, padd, left; 8772d1661a5SPawel Jakub Dawidek 8782d1661a5SPawel Jakub Dawidek sc = pbp->bio_to->geom->softc; 8792d1661a5SPawel Jakub Dawidek bp = NULL; 8802d1661a5SPawel Jakub Dawidek if ((pbp->bio_pflags & G_RAID3_BIO_PFLAG_NOPARITY) == 0) { 8812d1661a5SPawel Jakub Dawidek /* 8822d1661a5SPawel Jakub Dawidek * Find bio for which we should calculate data. 8832d1661a5SPawel Jakub Dawidek */ 8842d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 8852d1661a5SPawel Jakub Dawidek if ((cbp->bio_cflags & G_RAID3_BIO_CFLAG_PARITY) != 0) { 8862d1661a5SPawel Jakub Dawidek bp = cbp; 8872d1661a5SPawel Jakub Dawidek break; 8882d1661a5SPawel Jakub Dawidek } 8892d1661a5SPawel Jakub Dawidek } 8902d1661a5SPawel Jakub Dawidek KASSERT(bp != NULL, ("NULL parity bio.")); 8912d1661a5SPawel Jakub Dawidek } 8922d1661a5SPawel Jakub Dawidek atom = sc->sc_sectorsize / (sc->sc_ndisks - 1); 8932d1661a5SPawel Jakub Dawidek cadd = padd = 0; 8942d1661a5SPawel Jakub Dawidek for (left = pbp->bio_length; left > 0; left -= sc->sc_sectorsize) { 8952d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 8962d1661a5SPawel Jakub Dawidek if (cbp == bp) 8972d1661a5SPawel Jakub Dawidek continue; 8982d1661a5SPawel Jakub Dawidek bcopy(pbp->bio_data + padd, cbp->bio_data + cadd, atom); 8992d1661a5SPawel Jakub Dawidek padd += atom; 9002d1661a5SPawel Jakub Dawidek } 9012d1661a5SPawel Jakub Dawidek cadd += atom; 9022d1661a5SPawel Jakub Dawidek } 9032d1661a5SPawel Jakub Dawidek if ((pbp->bio_pflags & G_RAID3_BIO_PFLAG_NOPARITY) == 0) { 9042d1661a5SPawel Jakub Dawidek struct bio *tmpbp; 9052d1661a5SPawel Jakub Dawidek 9062d1661a5SPawel Jakub Dawidek /* 9072d1661a5SPawel Jakub Dawidek * Calculate parity. 9082d1661a5SPawel Jakub Dawidek */ 9092d1661a5SPawel Jakub Dawidek bzero(bp->bio_data, bp->bio_length); 9102d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_SAFE_BIO(pbp, cbp, tmpbp) { 9112d1661a5SPawel Jakub Dawidek if (cbp == bp) 9122d1661a5SPawel Jakub Dawidek continue; 9132d1661a5SPawel Jakub Dawidek g_raid3_xor(cbp->bio_data, bp->bio_data, bp->bio_data, 9142d1661a5SPawel Jakub Dawidek bp->bio_length); 9152d1661a5SPawel Jakub Dawidek if ((cbp->bio_cflags & G_RAID3_BIO_CFLAG_NODISK) != 0) 9162d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 9172d1661a5SPawel Jakub Dawidek } 9182d1661a5SPawel Jakub Dawidek } 9192d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 9202d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 9212d1661a5SPawel Jakub Dawidek 9222d1661a5SPawel Jakub Dawidek disk = cbp->bio_caller2; 9232d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 9242d1661a5SPawel Jakub Dawidek cbp->bio_to = cp->provider; 9252d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, cbp, "Sending request."); 9262d1661a5SPawel Jakub Dawidek KASSERT(cp->acr > 0 && cp->ace > 0, 9272d1661a5SPawel Jakub Dawidek ("Consumer %s not opened (r%dw%de%d).", cp->provider->name, 9282d1661a5SPawel Jakub Dawidek cp->acr, cp->acw, cp->ace)); 9292d1661a5SPawel Jakub Dawidek g_io_request(cbp, cp); 9302d1661a5SPawel Jakub Dawidek } 9312d1661a5SPawel Jakub Dawidek } 9322d1661a5SPawel Jakub Dawidek 9332d1661a5SPawel Jakub Dawidek static void 9342d1661a5SPawel Jakub Dawidek g_raid3_gather(struct bio *pbp) 9352d1661a5SPawel Jakub Dawidek { 9362d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 9372d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 938f5a2f7feSPawel Jakub Dawidek struct bio *xbp, *fbp, *cbp; 9392d1661a5SPawel Jakub Dawidek off_t atom, cadd, padd, left; 9402d1661a5SPawel Jakub Dawidek 9412d1661a5SPawel Jakub Dawidek sc = pbp->bio_to->geom->softc; 9422d1661a5SPawel Jakub Dawidek /* 943f5a2f7feSPawel Jakub Dawidek * Find bio for which we have to calculate data. 9442d1661a5SPawel Jakub Dawidek * While going through this path, check if all requests 9452d1661a5SPawel Jakub Dawidek * succeeded, if not, deny whole request. 946f5a2f7feSPawel Jakub Dawidek * If we're in COMPLETE mode, we allow one request to fail, 947f5a2f7feSPawel Jakub Dawidek * so if we find one, we're sending it to the parity consumer. 948f5a2f7feSPawel Jakub Dawidek * If there are more failed requests, we deny whole request. 9492d1661a5SPawel Jakub Dawidek */ 950f5a2f7feSPawel Jakub Dawidek xbp = fbp = NULL; 9512d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 9522d1661a5SPawel Jakub Dawidek if ((cbp->bio_cflags & G_RAID3_BIO_CFLAG_PARITY) != 0) { 953f5a2f7feSPawel Jakub Dawidek KASSERT(xbp == NULL, ("More than one parity bio.")); 954f5a2f7feSPawel Jakub Dawidek xbp = cbp; 9552d1661a5SPawel Jakub Dawidek } 9562d1661a5SPawel Jakub Dawidek if (cbp->bio_error == 0) 9572d1661a5SPawel Jakub Dawidek continue; 9582d1661a5SPawel Jakub Dawidek /* 9592d1661a5SPawel Jakub Dawidek * Found failed request. 9602d1661a5SPawel Jakub Dawidek */ 961f5a2f7feSPawel Jakub Dawidek G_RAID3_LOGREQ(0, cbp, "Request failed."); 9622d1661a5SPawel Jakub Dawidek disk = cbp->bio_caller2; 9632d1661a5SPawel Jakub Dawidek if (disk != NULL) { 9642d1661a5SPawel Jakub Dawidek /* 9652d1661a5SPawel Jakub Dawidek * Actually this is pointless to bump syncid, 9662d1661a5SPawel Jakub Dawidek * because whole device is fucked up. 9672d1661a5SPawel Jakub Dawidek */ 9682d1661a5SPawel Jakub Dawidek sc->sc_bump_syncid = G_RAID3_BUMP_IMMEDIATELY; 9692d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, 9702d1661a5SPawel Jakub Dawidek G_RAID3_DISK_STATE_DISCONNECTED, 9712d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 9722d1661a5SPawel Jakub Dawidek } 973f5a2f7feSPawel Jakub Dawidek if (fbp == NULL) { 974f5a2f7feSPawel Jakub Dawidek if ((pbp->bio_pflags & G_RAID3_BIO_PFLAG_DEGRADED) != 0) { 9752d1661a5SPawel Jakub Dawidek /* 976f5a2f7feSPawel Jakub Dawidek * We are already in degraded mode, so we can't 977f5a2f7feSPawel Jakub Dawidek * accept any failures. 9782d1661a5SPawel Jakub Dawidek */ 979f5a2f7feSPawel Jakub Dawidek if (pbp->bio_error == 0) 980f5a2f7feSPawel Jakub Dawidek pbp->bio_error = fbp->bio_error; 9812d1661a5SPawel Jakub Dawidek } else { 982f5a2f7feSPawel Jakub Dawidek fbp = cbp; 9832d1661a5SPawel Jakub Dawidek } 984f5a2f7feSPawel Jakub Dawidek } else { 9852d1661a5SPawel Jakub Dawidek /* 9862d1661a5SPawel Jakub Dawidek * Next failed request, that's too many. 9872d1661a5SPawel Jakub Dawidek */ 9882d1661a5SPawel Jakub Dawidek if (pbp->bio_error == 0) 989f5a2f7feSPawel Jakub Dawidek pbp->bio_error = fbp->bio_error; 9902d1661a5SPawel Jakub Dawidek } 9912d1661a5SPawel Jakub Dawidek } 9922d1661a5SPawel Jakub Dawidek if (pbp->bio_error != 0) 9932d1661a5SPawel Jakub Dawidek goto finish; 994dba915cfSPawel Jakub Dawidek if (fbp != NULL && (pbp->bio_pflags & G_RAID3_BIO_PFLAG_VERIFY) != 0) { 995dba915cfSPawel Jakub Dawidek pbp->bio_pflags &= ~G_RAID3_BIO_PFLAG_VERIFY; 996dba915cfSPawel Jakub Dawidek if (xbp != fbp) 997dba915cfSPawel Jakub Dawidek g_raid3_replace_bio(xbp, fbp); 998dba915cfSPawel Jakub Dawidek g_raid3_destroy_bio(sc, fbp); 999dba915cfSPawel Jakub Dawidek } else if (fbp != NULL) { 10002d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 10012d1661a5SPawel Jakub Dawidek 10022d1661a5SPawel Jakub Dawidek /* 10032d1661a5SPawel Jakub Dawidek * One request failed, so send the same request to 10042d1661a5SPawel Jakub Dawidek * the parity consumer. 10052d1661a5SPawel Jakub Dawidek */ 1006f5a2f7feSPawel Jakub Dawidek disk = pbp->bio_driver2; 10072d1661a5SPawel Jakub Dawidek if (disk->d_state != G_RAID3_DISK_STATE_ACTIVE) { 1008f5a2f7feSPawel Jakub Dawidek pbp->bio_error = fbp->bio_error; 10092d1661a5SPawel Jakub Dawidek goto finish; 10102d1661a5SPawel Jakub Dawidek } 10112d1661a5SPawel Jakub Dawidek pbp->bio_pflags |= G_RAID3_BIO_PFLAG_DEGRADED; 10122d1661a5SPawel Jakub Dawidek pbp->bio_inbed--; 1013f5a2f7feSPawel Jakub Dawidek fbp->bio_flags &= ~(BIO_DONE | BIO_ERROR); 1014f5a2f7feSPawel Jakub Dawidek if (disk->d_no == sc->sc_ndisks - 1) 1015f5a2f7feSPawel Jakub Dawidek fbp->bio_cflags |= G_RAID3_BIO_CFLAG_PARITY; 1016f5a2f7feSPawel Jakub Dawidek fbp->bio_error = 0; 1017f5a2f7feSPawel Jakub Dawidek fbp->bio_completed = 0; 1018f5a2f7feSPawel Jakub Dawidek fbp->bio_children = 0; 1019f5a2f7feSPawel Jakub Dawidek fbp->bio_inbed = 0; 10202d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 1021f5a2f7feSPawel Jakub Dawidek fbp->bio_caller2 = disk; 1022f5a2f7feSPawel Jakub Dawidek fbp->bio_to = cp->provider; 1023f5a2f7feSPawel Jakub Dawidek G_RAID3_LOGREQ(3, fbp, "Sending request (recover)."); 10242d1661a5SPawel Jakub Dawidek KASSERT(cp->acr > 0 && cp->ace > 0, 10252d1661a5SPawel Jakub Dawidek ("Consumer %s not opened (r%dw%de%d).", cp->provider->name, 10262d1661a5SPawel Jakub Dawidek cp->acr, cp->acw, cp->ace)); 1027f5a2f7feSPawel Jakub Dawidek g_io_request(fbp, cp); 10282d1661a5SPawel Jakub Dawidek return; 10292d1661a5SPawel Jakub Dawidek } 1030f5a2f7feSPawel Jakub Dawidek if (xbp != NULL) { 1031f5a2f7feSPawel Jakub Dawidek /* 1032f5a2f7feSPawel Jakub Dawidek * Calculate parity. 1033f5a2f7feSPawel Jakub Dawidek */ 1034f5a2f7feSPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 1035f5a2f7feSPawel Jakub Dawidek if ((cbp->bio_cflags & G_RAID3_BIO_CFLAG_PARITY) != 0) 1036f5a2f7feSPawel Jakub Dawidek continue; 1037f5a2f7feSPawel Jakub Dawidek g_raid3_xor(cbp->bio_data, xbp->bio_data, xbp->bio_data, 1038f5a2f7feSPawel Jakub Dawidek xbp->bio_length); 1039f5a2f7feSPawel Jakub Dawidek } 1040f5a2f7feSPawel Jakub Dawidek xbp->bio_cflags &= ~G_RAID3_BIO_CFLAG_PARITY; 1041dba915cfSPawel Jakub Dawidek if ((pbp->bio_pflags & G_RAID3_BIO_PFLAG_VERIFY) != 0) { 1042dba915cfSPawel Jakub Dawidek if (!g_raid3_is_zero(xbp)) { 1043dba915cfSPawel Jakub Dawidek g_raid3_parity_mismatch++; 1044dba915cfSPawel Jakub Dawidek pbp->bio_error = EIO; 1045dba915cfSPawel Jakub Dawidek goto finish; 1046dba915cfSPawel Jakub Dawidek } 1047dba915cfSPawel Jakub Dawidek g_raid3_destroy_bio(sc, xbp); 1048dba915cfSPawel Jakub Dawidek } 10492d1661a5SPawel Jakub Dawidek } 10502d1661a5SPawel Jakub Dawidek atom = sc->sc_sectorsize / (sc->sc_ndisks - 1); 10512d1661a5SPawel Jakub Dawidek cadd = padd = 0; 10522d1661a5SPawel Jakub Dawidek for (left = pbp->bio_length; left > 0; left -= sc->sc_sectorsize) { 10532d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 10542d1661a5SPawel Jakub Dawidek bcopy(cbp->bio_data + cadd, pbp->bio_data + padd, atom); 10552d1661a5SPawel Jakub Dawidek pbp->bio_completed += atom; 10562d1661a5SPawel Jakub Dawidek padd += atom; 10572d1661a5SPawel Jakub Dawidek } 10582d1661a5SPawel Jakub Dawidek cadd += atom; 10592d1661a5SPawel Jakub Dawidek } 10602d1661a5SPawel Jakub Dawidek finish: 10612d1661a5SPawel Jakub Dawidek if (pbp->bio_error == 0) 10622d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, pbp, "Request finished."); 10634cf67afeSPawel Jakub Dawidek else { 10644cf67afeSPawel Jakub Dawidek if ((pbp->bio_pflags & G_RAID3_BIO_PFLAG_VERIFY) != 0) 10654cf67afeSPawel Jakub Dawidek G_RAID3_LOGREQ(1, pbp, "Verification error."); 10662d1661a5SPawel Jakub Dawidek else 10672d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(0, pbp, "Request failed."); 10684cf67afeSPawel Jakub Dawidek } 1069dba915cfSPawel Jakub Dawidek pbp->bio_pflags &= ~G_RAID3_BIO_PFLAG_MASK; 10702d1661a5SPawel Jakub Dawidek g_io_deliver(pbp, pbp->bio_error); 10712d1661a5SPawel Jakub Dawidek while ((cbp = G_RAID3_HEAD_BIO(pbp)) != NULL) 10722d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 10732d1661a5SPawel Jakub Dawidek } 10742d1661a5SPawel Jakub Dawidek 10752d1661a5SPawel Jakub Dawidek static void 10762d1661a5SPawel Jakub Dawidek g_raid3_done(struct bio *bp) 10772d1661a5SPawel Jakub Dawidek { 10782d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 10792d1661a5SPawel Jakub Dawidek 10802d1661a5SPawel Jakub Dawidek sc = bp->bio_from->geom->softc; 10812d1661a5SPawel Jakub Dawidek bp->bio_cflags |= G_RAID3_BIO_CFLAG_REGULAR; 10822d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Regular request done (error=%d).", bp->bio_error); 10832d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 10842d1661a5SPawel Jakub Dawidek bioq_insert_head(&sc->sc_queue, bp); 10852d1661a5SPawel Jakub Dawidek wakeup(sc); 10862d1661a5SPawel Jakub Dawidek wakeup(&sc->sc_queue); 10872d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 10882d1661a5SPawel Jakub Dawidek } 10892d1661a5SPawel Jakub Dawidek 10902d1661a5SPawel Jakub Dawidek static void 10912d1661a5SPawel Jakub Dawidek g_raid3_regular_request(struct bio *cbp) 10922d1661a5SPawel Jakub Dawidek { 10932d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 10942d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 10952d1661a5SPawel Jakub Dawidek struct bio *pbp; 10962d1661a5SPawel Jakub Dawidek 10972d1661a5SPawel Jakub Dawidek g_topology_assert_not(); 10982d1661a5SPawel Jakub Dawidek 10992d1661a5SPawel Jakub Dawidek pbp = cbp->bio_parent; 11002d1661a5SPawel Jakub Dawidek sc = pbp->bio_to->geom->softc; 11012d1661a5SPawel Jakub Dawidek disk = cbp->bio_from->private; 11022d1661a5SPawel Jakub Dawidek if (disk == NULL) { 11032d1661a5SPawel Jakub Dawidek g_topology_lock(); 11042d1661a5SPawel Jakub Dawidek g_raid3_kill_consumer(sc, cbp->bio_from); 11052d1661a5SPawel Jakub Dawidek g_topology_unlock(); 11062d1661a5SPawel Jakub Dawidek } 11072d1661a5SPawel Jakub Dawidek 11082d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, cbp, "Request finished."); 11092d1661a5SPawel Jakub Dawidek pbp->bio_inbed++; 11102d1661a5SPawel Jakub Dawidek KASSERT(pbp->bio_inbed <= pbp->bio_children, 11112d1661a5SPawel Jakub Dawidek ("bio_inbed (%u) is bigger than bio_children (%u).", pbp->bio_inbed, 11122d1661a5SPawel Jakub Dawidek pbp->bio_children)); 11132d1661a5SPawel Jakub Dawidek if (pbp->bio_inbed != pbp->bio_children) 11142d1661a5SPawel Jakub Dawidek return; 11152d1661a5SPawel Jakub Dawidek switch (pbp->bio_cmd) { 11162d1661a5SPawel Jakub Dawidek case BIO_READ: 11172d1661a5SPawel Jakub Dawidek g_raid3_gather(pbp); 11182d1661a5SPawel Jakub Dawidek break; 11192d1661a5SPawel Jakub Dawidek case BIO_WRITE: 11202d1661a5SPawel Jakub Dawidek case BIO_DELETE: 11212d1661a5SPawel Jakub Dawidek { 11222d1661a5SPawel Jakub Dawidek int error = 0; 11232d1661a5SPawel Jakub Dawidek 11242d1661a5SPawel Jakub Dawidek pbp->bio_completed = pbp->bio_length; 11252d1661a5SPawel Jakub Dawidek while ((cbp = G_RAID3_HEAD_BIO(pbp)) != NULL) { 11262d1661a5SPawel Jakub Dawidek if (cbp->bio_error != 0) { 11272d1661a5SPawel Jakub Dawidek disk = cbp->bio_caller2; 11282d1661a5SPawel Jakub Dawidek if (disk != NULL) { 11292d1661a5SPawel Jakub Dawidek sc->sc_bump_syncid = 11302d1661a5SPawel Jakub Dawidek G_RAID3_BUMP_IMMEDIATELY; 11312d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, 11322d1661a5SPawel Jakub Dawidek G_RAID3_DISK_STATE_DISCONNECTED, 11332d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 11342d1661a5SPawel Jakub Dawidek } 11352d1661a5SPawel Jakub Dawidek if (error == 0) 11362d1661a5SPawel Jakub Dawidek error = cbp->bio_error; 11372d1661a5SPawel Jakub Dawidek else if (pbp->bio_error == 0) { 11382d1661a5SPawel Jakub Dawidek /* 11392d1661a5SPawel Jakub Dawidek * Next failed request, that's too many. 11402d1661a5SPawel Jakub Dawidek */ 11412d1661a5SPawel Jakub Dawidek pbp->bio_error = error; 11422d1661a5SPawel Jakub Dawidek } 11432d1661a5SPawel Jakub Dawidek } 11442d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 11452d1661a5SPawel Jakub Dawidek } 11462d1661a5SPawel Jakub Dawidek if (pbp->bio_error == 0) 11472d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, pbp, "Request finished."); 11482d1661a5SPawel Jakub Dawidek else 11492d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(0, pbp, "Request failed."); 11502d1661a5SPawel Jakub Dawidek pbp->bio_pflags &= ~G_RAID3_BIO_PFLAG_DEGRADED; 11512d1661a5SPawel Jakub Dawidek pbp->bio_pflags &= ~G_RAID3_BIO_PFLAG_NOPARITY; 11522d1661a5SPawel Jakub Dawidek g_io_deliver(pbp, pbp->bio_error); 11532d1661a5SPawel Jakub Dawidek break; 11542d1661a5SPawel Jakub Dawidek } 11552d1661a5SPawel Jakub Dawidek } 11562d1661a5SPawel Jakub Dawidek } 11572d1661a5SPawel Jakub Dawidek 11582d1661a5SPawel Jakub Dawidek static void 11592d1661a5SPawel Jakub Dawidek g_raid3_sync_done(struct bio *bp) 11602d1661a5SPawel Jakub Dawidek { 11612d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 11622d1661a5SPawel Jakub Dawidek 11632d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Synchronization request delivered."); 11642d1661a5SPawel Jakub Dawidek sc = bp->bio_from->geom->softc; 11652d1661a5SPawel Jakub Dawidek bp->bio_cflags |= G_RAID3_BIO_CFLAG_SYNC; 11662d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 11672d1661a5SPawel Jakub Dawidek bioq_insert_head(&sc->sc_queue, bp); 11682d1661a5SPawel Jakub Dawidek wakeup(sc); 11692d1661a5SPawel Jakub Dawidek wakeup(&sc->sc_queue); 11702d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 11712d1661a5SPawel Jakub Dawidek } 11722d1661a5SPawel Jakub Dawidek 11732d1661a5SPawel Jakub Dawidek static void 11742d1661a5SPawel Jakub Dawidek g_raid3_start(struct bio *bp) 11752d1661a5SPawel Jakub Dawidek { 11762d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 11772d1661a5SPawel Jakub Dawidek 11782d1661a5SPawel Jakub Dawidek sc = bp->bio_to->geom->softc; 11792d1661a5SPawel Jakub Dawidek /* 11802d1661a5SPawel Jakub Dawidek * If sc == NULL or there are no valid disks, provider's error 11812d1661a5SPawel Jakub Dawidek * should be set and g_raid3_start() should not be called at all. 11822d1661a5SPawel Jakub Dawidek */ 11832d1661a5SPawel Jakub Dawidek KASSERT(sc != NULL && (sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 11842d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE), 11852d1661a5SPawel Jakub Dawidek ("Provider's error should be set (error=%d)(device=%s).", 11862d1661a5SPawel Jakub Dawidek bp->bio_to->error, bp->bio_to->name)); 11872d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Request received."); 11882d1661a5SPawel Jakub Dawidek 11892d1661a5SPawel Jakub Dawidek switch (bp->bio_cmd) { 11902d1661a5SPawel Jakub Dawidek case BIO_READ: 11912d1661a5SPawel Jakub Dawidek case BIO_WRITE: 11922d1661a5SPawel Jakub Dawidek case BIO_DELETE: 11932d1661a5SPawel Jakub Dawidek break; 11942d1661a5SPawel Jakub Dawidek case BIO_GETATTR: 11952d1661a5SPawel Jakub Dawidek default: 11962d1661a5SPawel Jakub Dawidek g_io_deliver(bp, EOPNOTSUPP); 11972d1661a5SPawel Jakub Dawidek return; 11982d1661a5SPawel Jakub Dawidek } 11992d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 12002d1661a5SPawel Jakub Dawidek bioq_insert_tail(&sc->sc_queue, bp); 12012d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, sc); 12022d1661a5SPawel Jakub Dawidek wakeup(sc); 12032d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 12042d1661a5SPawel Jakub Dawidek } 12052d1661a5SPawel Jakub Dawidek 12062d1661a5SPawel Jakub Dawidek /* 12072d1661a5SPawel Jakub Dawidek * Send one synchronization request. 12082d1661a5SPawel Jakub Dawidek */ 12092d1661a5SPawel Jakub Dawidek static void 12102d1661a5SPawel Jakub Dawidek g_raid3_sync_one(struct g_raid3_softc *sc) 12112d1661a5SPawel Jakub Dawidek { 12122d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 12132d1661a5SPawel Jakub Dawidek struct bio *bp; 12142d1661a5SPawel Jakub Dawidek 12152d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED, 12162d1661a5SPawel Jakub Dawidek ("Wrong device state (%s, %s).", sc->sc_name, 12172d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state))); 12182d1661a5SPawel Jakub Dawidek disk = sc->sc_syncdisk; 12192d1661a5SPawel Jakub Dawidek KASSERT(disk != NULL, ("No sync disk (%s).", sc->sc_name)); 12202d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING, 12212d1661a5SPawel Jakub Dawidek ("Disk %s is not marked for synchronization.", 12222d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk))); 12232d1661a5SPawel Jakub Dawidek 12242d1661a5SPawel Jakub Dawidek bp = g_new_bio(); 12252d1661a5SPawel Jakub Dawidek if (bp == NULL) 12262d1661a5SPawel Jakub Dawidek return; 12272d1661a5SPawel Jakub Dawidek bp->bio_parent = NULL; 12282d1661a5SPawel Jakub Dawidek bp->bio_cmd = BIO_READ; 12292d1661a5SPawel Jakub Dawidek bp->bio_offset = disk->d_sync.ds_offset * (sc->sc_ndisks - 1); 12302d1661a5SPawel Jakub Dawidek bp->bio_length = MIN(G_RAID3_MAX_IO_SIZE, 12312d1661a5SPawel Jakub Dawidek sc->sc_mediasize - bp->bio_offset); 12322d1661a5SPawel Jakub Dawidek bp->bio_cflags = 0; 12332d1661a5SPawel Jakub Dawidek bp->bio_done = g_raid3_sync_done; 12342d1661a5SPawel Jakub Dawidek bp->bio_data = disk->d_sync.ds_data; 12352d1661a5SPawel Jakub Dawidek if (bp->bio_data == NULL) { 12362d1661a5SPawel Jakub Dawidek g_destroy_bio(bp); 12372d1661a5SPawel Jakub Dawidek return; 12382d1661a5SPawel Jakub Dawidek } 12392d1661a5SPawel Jakub Dawidek bp->bio_cflags = G_RAID3_BIO_CFLAG_REGSYNC; 12402d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset += bp->bio_length / (sc->sc_ndisks - 1); 12412d1661a5SPawel Jakub Dawidek bp->bio_to = sc->sc_provider; 12422d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Sending synchronization request."); 12432d1661a5SPawel Jakub Dawidek g_io_request(bp, disk->d_sync.ds_consumer); 12442d1661a5SPawel Jakub Dawidek } 12452d1661a5SPawel Jakub Dawidek 12462d1661a5SPawel Jakub Dawidek static void 12472d1661a5SPawel Jakub Dawidek g_raid3_sync_request(struct bio *bp) 12482d1661a5SPawel Jakub Dawidek { 12492d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 12502d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 12512d1661a5SPawel Jakub Dawidek 12522d1661a5SPawel Jakub Dawidek sc = bp->bio_from->geom->softc; 12532d1661a5SPawel Jakub Dawidek disk = bp->bio_from->private; 12542d1661a5SPawel Jakub Dawidek if (disk == NULL) { 12552d1661a5SPawel Jakub Dawidek g_topology_lock(); 12562d1661a5SPawel Jakub Dawidek g_raid3_kill_consumer(sc, bp->bio_from); 12572d1661a5SPawel Jakub Dawidek g_topology_unlock(); 12582d1661a5SPawel Jakub Dawidek g_destroy_bio(bp); 12592d1661a5SPawel Jakub Dawidek return; 12602d1661a5SPawel Jakub Dawidek } 12612d1661a5SPawel Jakub Dawidek 12622d1661a5SPawel Jakub Dawidek /* 12632d1661a5SPawel Jakub Dawidek * Synchronization request. 12642d1661a5SPawel Jakub Dawidek */ 12652d1661a5SPawel Jakub Dawidek switch (bp->bio_cmd) { 12662d1661a5SPawel Jakub Dawidek case BIO_READ: 12672d1661a5SPawel Jakub Dawidek { 12682d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 12692d1661a5SPawel Jakub Dawidek u_char *dst, *src; 12702d1661a5SPawel Jakub Dawidek off_t left; 12712d1661a5SPawel Jakub Dawidek u_int atom; 12722d1661a5SPawel Jakub Dawidek 12732d1661a5SPawel Jakub Dawidek if (bp->bio_error != 0) { 12742d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(0, bp, 12752d1661a5SPawel Jakub Dawidek "Synchronization request failed (error=%d).", 12762d1661a5SPawel Jakub Dawidek bp->bio_error); 12772d1661a5SPawel Jakub Dawidek g_destroy_bio(bp); 12782d1661a5SPawel Jakub Dawidek return; 12792d1661a5SPawel Jakub Dawidek } 12802d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Synchronization request finished."); 12812d1661a5SPawel Jakub Dawidek atom = sc->sc_sectorsize / (sc->sc_ndisks - 1); 12822d1661a5SPawel Jakub Dawidek dst = src = bp->bio_data; 12832d1661a5SPawel Jakub Dawidek if (disk->d_no == sc->sc_ndisks - 1) { 12842d1661a5SPawel Jakub Dawidek u_int n; 12852d1661a5SPawel Jakub Dawidek 12862d1661a5SPawel Jakub Dawidek /* Parity component. */ 12872d1661a5SPawel Jakub Dawidek for (left = bp->bio_length; left > 0; 12882d1661a5SPawel Jakub Dawidek left -= sc->sc_sectorsize) { 12892d1661a5SPawel Jakub Dawidek bcopy(src, dst, atom); 12902d1661a5SPawel Jakub Dawidek src += atom; 12912d1661a5SPawel Jakub Dawidek for (n = 1; n < sc->sc_ndisks - 1; n++) { 12922d1661a5SPawel Jakub Dawidek g_raid3_xor(src, dst, dst, atom); 12932d1661a5SPawel Jakub Dawidek src += atom; 12942d1661a5SPawel Jakub Dawidek } 12952d1661a5SPawel Jakub Dawidek dst += atom; 12962d1661a5SPawel Jakub Dawidek } 12972d1661a5SPawel Jakub Dawidek } else { 12982d1661a5SPawel Jakub Dawidek /* Regular component. */ 12992d1661a5SPawel Jakub Dawidek src += atom * disk->d_no; 13002d1661a5SPawel Jakub Dawidek for (left = bp->bio_length; left > 0; 13012d1661a5SPawel Jakub Dawidek left -= sc->sc_sectorsize) { 13022d1661a5SPawel Jakub Dawidek bcopy(src, dst, atom); 13032d1661a5SPawel Jakub Dawidek src += sc->sc_sectorsize; 13042d1661a5SPawel Jakub Dawidek dst += atom; 13052d1661a5SPawel Jakub Dawidek } 13062d1661a5SPawel Jakub Dawidek } 13072d1661a5SPawel Jakub Dawidek bp->bio_offset /= sc->sc_ndisks - 1; 13082d1661a5SPawel Jakub Dawidek bp->bio_length /= sc->sc_ndisks - 1; 13092d1661a5SPawel Jakub Dawidek bp->bio_cmd = BIO_WRITE; 13102d1661a5SPawel Jakub Dawidek bp->bio_cflags = 0; 13112d1661a5SPawel Jakub Dawidek bp->bio_children = bp->bio_inbed = 0; 13122d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 13132d1661a5SPawel Jakub Dawidek KASSERT(cp->acr == 0 && cp->acw == 1 && cp->ace == 1, 13142d1661a5SPawel Jakub Dawidek ("Consumer %s not opened (r%dw%de%d).", cp->provider->name, 13152d1661a5SPawel Jakub Dawidek cp->acr, cp->acw, cp->ace)); 13162d1661a5SPawel Jakub Dawidek g_io_request(bp, cp); 13172d1661a5SPawel Jakub Dawidek return; 13182d1661a5SPawel Jakub Dawidek } 13192d1661a5SPawel Jakub Dawidek case BIO_WRITE: 13202d1661a5SPawel Jakub Dawidek if (bp->bio_error != 0) { 13212d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(0, bp, 13222d1661a5SPawel Jakub Dawidek "Synchronization request failed (error=%d).", 13232d1661a5SPawel Jakub Dawidek bp->bio_error); 13242d1661a5SPawel Jakub Dawidek g_destroy_bio(bp); 13252d1661a5SPawel Jakub Dawidek sc->sc_bump_syncid = G_RAID3_BUMP_IMMEDIATELY; 13262d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, 13272d1661a5SPawel Jakub Dawidek G_RAID3_DISK_STATE_DISCONNECTED, 13282d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 13292d1661a5SPawel Jakub Dawidek return; 13302d1661a5SPawel Jakub Dawidek } 13312d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Synchronization request finished."); 13322d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset_done = bp->bio_offset + bp->bio_length; 13332d1661a5SPawel Jakub Dawidek g_destroy_bio(bp); 13342d1661a5SPawel Jakub Dawidek if (disk->d_sync.ds_offset_done == 1335c0d68b6eSPawel Jakub Dawidek sc->sc_mediasize / (sc->sc_ndisks - 1)) { 13362d1661a5SPawel Jakub Dawidek /* 13372d1661a5SPawel Jakub Dawidek * Disk up-to-date, activate it. 13382d1661a5SPawel Jakub Dawidek */ 13392d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, G_RAID3_DISK_STATE_ACTIVE, 13402d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 13412d1661a5SPawel Jakub Dawidek return; 13422d1661a5SPawel Jakub Dawidek } else if ((disk->d_sync.ds_offset_done % 13432d1661a5SPawel Jakub Dawidek (G_RAID3_MAX_IO_SIZE * 100)) == 0) { 13442d1661a5SPawel Jakub Dawidek /* 13452d1661a5SPawel Jakub Dawidek * Update offset_done on every 100 blocks. 13462d1661a5SPawel Jakub Dawidek * XXX: This should be configurable. 13472d1661a5SPawel Jakub Dawidek */ 13482d1661a5SPawel Jakub Dawidek g_topology_lock(); 13492d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(disk); 13502d1661a5SPawel Jakub Dawidek g_topology_unlock(); 13512d1661a5SPawel Jakub Dawidek } 13522d1661a5SPawel Jakub Dawidek return; 13532d1661a5SPawel Jakub Dawidek default: 13542d1661a5SPawel Jakub Dawidek KASSERT(1 == 0, ("Invalid command here: %u (device=%s)", 13552d1661a5SPawel Jakub Dawidek bp->bio_cmd, sc->sc_name)); 13562d1661a5SPawel Jakub Dawidek break; 13572d1661a5SPawel Jakub Dawidek } 13582d1661a5SPawel Jakub Dawidek } 13592d1661a5SPawel Jakub Dawidek 13602d1661a5SPawel Jakub Dawidek static int 13612d1661a5SPawel Jakub Dawidek g_raid3_register_request(struct bio *pbp) 13622d1661a5SPawel Jakub Dawidek { 13632d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 13642d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 13652d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 13662d1661a5SPawel Jakub Dawidek struct bio *cbp; 13672d1661a5SPawel Jakub Dawidek off_t offset, length; 1368fa6a7837SDavid E. O'Brien u_int n, ndisks; 1369dba915cfSPawel Jakub Dawidek int round_robin, verify; 13702d1661a5SPawel Jakub Dawidek 1371fa6a7837SDavid E. O'Brien ndisks = 0; 13722d1661a5SPawel Jakub Dawidek sc = pbp->bio_to->geom->softc; 13732d1661a5SPawel Jakub Dawidek if ((pbp->bio_cflags & G_RAID3_BIO_CFLAG_REGSYNC) != 0 && 13742d1661a5SPawel Jakub Dawidek sc->sc_syncdisk == NULL) { 13752d1661a5SPawel Jakub Dawidek g_io_deliver(pbp, EIO); 13762d1661a5SPawel Jakub Dawidek return (0); 13772d1661a5SPawel Jakub Dawidek } 13782d1661a5SPawel Jakub Dawidek g_raid3_init_bio(pbp); 13792d1661a5SPawel Jakub Dawidek length = pbp->bio_length / (sc->sc_ndisks - 1); 13802d1661a5SPawel Jakub Dawidek offset = pbp->bio_offset / (sc->sc_ndisks - 1); 1381dba915cfSPawel Jakub Dawidek round_robin = verify = 0; 13822d1661a5SPawel Jakub Dawidek switch (pbp->bio_cmd) { 13832d1661a5SPawel Jakub Dawidek case BIO_READ: 1384dba915cfSPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_VERIFY) != 0 && 1385dba915cfSPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE) { 1386dba915cfSPawel Jakub Dawidek pbp->bio_pflags |= G_RAID3_BIO_PFLAG_VERIFY; 1387dba915cfSPawel Jakub Dawidek verify = 1; 1388dba915cfSPawel Jakub Dawidek ndisks = sc->sc_ndisks; 1389dba915cfSPawel Jakub Dawidek } else { 1390dba915cfSPawel Jakub Dawidek verify = 0; 13912d1661a5SPawel Jakub Dawidek ndisks = sc->sc_ndisks - 1; 1392dba915cfSPawel Jakub Dawidek } 1393dba915cfSPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_ROUND_ROBIN) != 0 && 1394dba915cfSPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE) { 1395dba915cfSPawel Jakub Dawidek round_robin = 1; 1396dba915cfSPawel Jakub Dawidek } else { 1397dba915cfSPawel Jakub Dawidek round_robin = 0; 1398dba915cfSPawel Jakub Dawidek } 1399dba915cfSPawel Jakub Dawidek KASSERT(!round_robin || !verify, 1400dba915cfSPawel Jakub Dawidek ("ROUND-ROBIN and VERIFY are mutually exclusive.")); 1401f5a2f7feSPawel Jakub Dawidek pbp->bio_driver2 = &sc->sc_disks[sc->sc_ndisks - 1]; 14022d1661a5SPawel Jakub Dawidek break; 14032d1661a5SPawel Jakub Dawidek case BIO_WRITE: 14042d1661a5SPawel Jakub Dawidek case BIO_DELETE: 14052d1661a5SPawel Jakub Dawidek ndisks = sc->sc_ndisks; 14062d1661a5SPawel Jakub Dawidek break; 14072d1661a5SPawel Jakub Dawidek } 14082d1661a5SPawel Jakub Dawidek for (n = 0; n < ndisks; n++) { 14092d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 14102d1661a5SPawel Jakub Dawidek cbp = g_raid3_clone_bio(sc, pbp); 14112d1661a5SPawel Jakub Dawidek if (cbp == NULL) { 14122d1661a5SPawel Jakub Dawidek while ((cbp = G_RAID3_HEAD_BIO(pbp)) != NULL) 14132d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 14142d1661a5SPawel Jakub Dawidek return (ENOMEM); 14152d1661a5SPawel Jakub Dawidek } 14162d1661a5SPawel Jakub Dawidek cbp->bio_offset = offset; 14172d1661a5SPawel Jakub Dawidek cbp->bio_length = length; 14182d1661a5SPawel Jakub Dawidek cbp->bio_done = g_raid3_done; 14192d1661a5SPawel Jakub Dawidek switch (pbp->bio_cmd) { 14202d1661a5SPawel Jakub Dawidek case BIO_READ: 14212d1661a5SPawel Jakub Dawidek if (disk->d_state != G_RAID3_DISK_STATE_ACTIVE) { 14222d1661a5SPawel Jakub Dawidek /* 14232d1661a5SPawel Jakub Dawidek * Replace invalid component with the parity 14242d1661a5SPawel Jakub Dawidek * component. 14252d1661a5SPawel Jakub Dawidek */ 14262d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[sc->sc_ndisks - 1]; 14272d1661a5SPawel Jakub Dawidek cbp->bio_cflags |= G_RAID3_BIO_CFLAG_PARITY; 14282d1661a5SPawel Jakub Dawidek pbp->bio_pflags |= G_RAID3_BIO_PFLAG_DEGRADED; 1429f5a2f7feSPawel Jakub Dawidek } else if (round_robin && 1430f5a2f7feSPawel Jakub Dawidek disk->d_no == sc->sc_round_robin) { 1431f5a2f7feSPawel Jakub Dawidek /* 1432f5a2f7feSPawel Jakub Dawidek * In round-robin mode skip one data component 1433f5a2f7feSPawel Jakub Dawidek * and use parity component when reading. 1434f5a2f7feSPawel Jakub Dawidek */ 1435f5a2f7feSPawel Jakub Dawidek pbp->bio_driver2 = disk; 1436f5a2f7feSPawel Jakub Dawidek disk = &sc->sc_disks[sc->sc_ndisks - 1]; 1437f5a2f7feSPawel Jakub Dawidek cbp->bio_cflags |= G_RAID3_BIO_CFLAG_PARITY; 1438f5a2f7feSPawel Jakub Dawidek sc->sc_round_robin++; 1439f5a2f7feSPawel Jakub Dawidek round_robin = 0; 1440dba915cfSPawel Jakub Dawidek } else if (verify && disk->d_no == sc->sc_ndisks - 1) { 1441dba915cfSPawel Jakub Dawidek cbp->bio_cflags |= G_RAID3_BIO_CFLAG_PARITY; 14422d1661a5SPawel Jakub Dawidek } 14432d1661a5SPawel Jakub Dawidek break; 14442d1661a5SPawel Jakub Dawidek case BIO_WRITE: 14452d1661a5SPawel Jakub Dawidek case BIO_DELETE: 14462d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_ACTIVE || 14472d1661a5SPawel Jakub Dawidek disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING) { 14482d1661a5SPawel Jakub Dawidek if (n == ndisks - 1) { 14492d1661a5SPawel Jakub Dawidek /* 14502d1661a5SPawel Jakub Dawidek * Active parity component, mark it as such. 14512d1661a5SPawel Jakub Dawidek */ 14522d1661a5SPawel Jakub Dawidek cbp->bio_cflags |= 14532d1661a5SPawel Jakub Dawidek G_RAID3_BIO_CFLAG_PARITY; 14542d1661a5SPawel Jakub Dawidek } 14552d1661a5SPawel Jakub Dawidek } else { 14562d1661a5SPawel Jakub Dawidek pbp->bio_pflags |= G_RAID3_BIO_PFLAG_DEGRADED; 14572d1661a5SPawel Jakub Dawidek if (n == ndisks - 1) { 14582d1661a5SPawel Jakub Dawidek /* 14592d1661a5SPawel Jakub Dawidek * Parity component is not connected, 14602d1661a5SPawel Jakub Dawidek * so destroy its request. 14612d1661a5SPawel Jakub Dawidek */ 14622d1661a5SPawel Jakub Dawidek pbp->bio_pflags |= 14632d1661a5SPawel Jakub Dawidek G_RAID3_BIO_PFLAG_NOPARITY; 14642d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 14652d1661a5SPawel Jakub Dawidek cbp = NULL; 14662d1661a5SPawel Jakub Dawidek } else { 14672d1661a5SPawel Jakub Dawidek cbp->bio_cflags |= 14682d1661a5SPawel Jakub Dawidek G_RAID3_BIO_CFLAG_NODISK; 14692d1661a5SPawel Jakub Dawidek disk = NULL; 14702d1661a5SPawel Jakub Dawidek } 14712d1661a5SPawel Jakub Dawidek } 14722d1661a5SPawel Jakub Dawidek break; 14732d1661a5SPawel Jakub Dawidek } 14742d1661a5SPawel Jakub Dawidek if (cbp != NULL) 14752d1661a5SPawel Jakub Dawidek cbp->bio_caller2 = disk; 14762d1661a5SPawel Jakub Dawidek } 14772d1661a5SPawel Jakub Dawidek switch (pbp->bio_cmd) { 14782d1661a5SPawel Jakub Dawidek case BIO_READ: 1479f5a2f7feSPawel Jakub Dawidek if (round_robin) { 1480f5a2f7feSPawel Jakub Dawidek /* 1481f5a2f7feSPawel Jakub Dawidek * If we are in round-robin mode and 'round_robin' is 1482f5a2f7feSPawel Jakub Dawidek * still 1, it means, that we skipped parity component 1483f5a2f7feSPawel Jakub Dawidek * for this read and must reset sc_round_robin field. 1484f5a2f7feSPawel Jakub Dawidek */ 1485f5a2f7feSPawel Jakub Dawidek sc->sc_round_robin = 0; 1486f5a2f7feSPawel Jakub Dawidek } 14872d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 14882d1661a5SPawel Jakub Dawidek disk = cbp->bio_caller2; 14892d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 14902d1661a5SPawel Jakub Dawidek cbp->bio_to = cp->provider; 14912d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, cbp, "Sending request."); 14922d1661a5SPawel Jakub Dawidek KASSERT(cp->acr > 0 && cp->ace > 0, 14932d1661a5SPawel Jakub Dawidek ("Consumer %s not opened (r%dw%de%d).", 14942d1661a5SPawel Jakub Dawidek cp->provider->name, cp->acr, cp->acw, cp->ace)); 14952d1661a5SPawel Jakub Dawidek g_io_request(cbp, cp); 14962d1661a5SPawel Jakub Dawidek } 14972d1661a5SPawel Jakub Dawidek break; 14982d1661a5SPawel Jakub Dawidek case BIO_WRITE: 14992d1661a5SPawel Jakub Dawidek case BIO_DELETE: 15002d1661a5SPawel Jakub Dawidek /* 15012d1661a5SPawel Jakub Dawidek * Bump syncid on first write. 15022d1661a5SPawel Jakub Dawidek */ 15032d1661a5SPawel Jakub Dawidek if (sc->sc_bump_syncid == G_RAID3_BUMP_ON_FIRST_WRITE) { 15042d1661a5SPawel Jakub Dawidek sc->sc_bump_syncid = 0; 15052d1661a5SPawel Jakub Dawidek g_topology_lock(); 15062d1661a5SPawel Jakub Dawidek g_raid3_bump_syncid(sc); 15072d1661a5SPawel Jakub Dawidek g_topology_unlock(); 15082d1661a5SPawel Jakub Dawidek } 15092d1661a5SPawel Jakub Dawidek g_raid3_scatter(pbp); 15102d1661a5SPawel Jakub Dawidek break; 15112d1661a5SPawel Jakub Dawidek } 15122d1661a5SPawel Jakub Dawidek return (0); 15132d1661a5SPawel Jakub Dawidek } 15142d1661a5SPawel Jakub Dawidek 15152d1661a5SPawel Jakub Dawidek static int 15162d1661a5SPawel Jakub Dawidek g_raid3_can_destroy(struct g_raid3_softc *sc) 15172d1661a5SPawel Jakub Dawidek { 15182d1661a5SPawel Jakub Dawidek struct g_geom *gp; 15192d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 15202d1661a5SPawel Jakub Dawidek 15212d1661a5SPawel Jakub Dawidek g_topology_assert(); 15222d1661a5SPawel Jakub Dawidek gp = sc->sc_geom; 15232d1661a5SPawel Jakub Dawidek LIST_FOREACH(cp, &gp->consumer, consumer) { 15242d1661a5SPawel Jakub Dawidek if (g_raid3_is_busy(sc, cp)) 15252d1661a5SPawel Jakub Dawidek return (0); 15262d1661a5SPawel Jakub Dawidek } 15272d1661a5SPawel Jakub Dawidek gp = sc->sc_sync.ds_geom; 15282d1661a5SPawel Jakub Dawidek LIST_FOREACH(cp, &gp->consumer, consumer) { 15292d1661a5SPawel Jakub Dawidek if (g_raid3_is_busy(sc, cp)) 15302d1661a5SPawel Jakub Dawidek return (0); 15312d1661a5SPawel Jakub Dawidek } 15322d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "No I/O requests for %s, it can be destroyed.", 15332d1661a5SPawel Jakub Dawidek sc->sc_name); 15342d1661a5SPawel Jakub Dawidek return (1); 15352d1661a5SPawel Jakub Dawidek } 15362d1661a5SPawel Jakub Dawidek 15372d1661a5SPawel Jakub Dawidek static int 15382d1661a5SPawel Jakub Dawidek g_raid3_try_destroy(struct g_raid3_softc *sc) 15392d1661a5SPawel Jakub Dawidek { 15402d1661a5SPawel Jakub Dawidek 15412d1661a5SPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_WAIT) != 0) { 15422d1661a5SPawel Jakub Dawidek g_topology_lock(); 15432d1661a5SPawel Jakub Dawidek if (!g_raid3_can_destroy(sc)) { 15442d1661a5SPawel Jakub Dawidek g_topology_unlock(); 15452d1661a5SPawel Jakub Dawidek return (0); 15462d1661a5SPawel Jakub Dawidek } 15472d1661a5SPawel Jakub Dawidek g_topology_unlock(); 15482d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, 15492d1661a5SPawel Jakub Dawidek &sc->sc_worker); 15502d1661a5SPawel Jakub Dawidek wakeup(&sc->sc_worker); 15512d1661a5SPawel Jakub Dawidek sc->sc_worker = NULL; 15522d1661a5SPawel Jakub Dawidek } else { 15532d1661a5SPawel Jakub Dawidek g_topology_lock(); 15542d1661a5SPawel Jakub Dawidek if (!g_raid3_can_destroy(sc)) { 15552d1661a5SPawel Jakub Dawidek g_topology_unlock(); 15562d1661a5SPawel Jakub Dawidek return (0); 15572d1661a5SPawel Jakub Dawidek } 15582d1661a5SPawel Jakub Dawidek g_raid3_destroy_device(sc); 15592d1661a5SPawel Jakub Dawidek g_topology_unlock(); 15602d1661a5SPawel Jakub Dawidek free(sc->sc_disks, M_RAID3); 15612d1661a5SPawel Jakub Dawidek free(sc, M_RAID3); 15622d1661a5SPawel Jakub Dawidek } 15632d1661a5SPawel Jakub Dawidek return (1); 15642d1661a5SPawel Jakub Dawidek } 15652d1661a5SPawel Jakub Dawidek 15662d1661a5SPawel Jakub Dawidek /* 15672d1661a5SPawel Jakub Dawidek * Worker thread. 15682d1661a5SPawel Jakub Dawidek */ 15692d1661a5SPawel Jakub Dawidek static void 15702d1661a5SPawel Jakub Dawidek g_raid3_worker(void *arg) 15712d1661a5SPawel Jakub Dawidek { 15722d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 15732d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 15742d1661a5SPawel Jakub Dawidek struct g_raid3_event *ep; 15752d1661a5SPawel Jakub Dawidek struct bio *bp; 15762d1661a5SPawel Jakub Dawidek u_int nreqs; 15772d1661a5SPawel Jakub Dawidek 15782d1661a5SPawel Jakub Dawidek sc = arg; 15792d1661a5SPawel Jakub Dawidek curthread->td_base_pri = PRIBIO; 15802d1661a5SPawel Jakub Dawidek 15812d1661a5SPawel Jakub Dawidek nreqs = 0; 15822d1661a5SPawel Jakub Dawidek for (;;) { 15832d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(5, "%s: Let's see...", __func__); 15842d1661a5SPawel Jakub Dawidek /* 15852d1661a5SPawel Jakub Dawidek * First take a look at events. 15862d1661a5SPawel Jakub Dawidek * This is important to handle events before any I/O requests. 15872d1661a5SPawel Jakub Dawidek */ 15882d1661a5SPawel Jakub Dawidek ep = g_raid3_event_get(sc); 15892d1661a5SPawel Jakub Dawidek if (ep != NULL) { 15902d1661a5SPawel Jakub Dawidek g_topology_lock(); 15912d1661a5SPawel Jakub Dawidek if ((ep->e_flags & G_RAID3_EVENT_DEVICE) != 0) { 15922d1661a5SPawel Jakub Dawidek /* Update only device status. */ 15932d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(3, 15942d1661a5SPawel Jakub Dawidek "Running event for device %s.", 15952d1661a5SPawel Jakub Dawidek sc->sc_name); 15962d1661a5SPawel Jakub Dawidek ep->e_error = 0; 15972d1661a5SPawel Jakub Dawidek g_raid3_update_device(sc, 1); 15982d1661a5SPawel Jakub Dawidek } else { 15992d1661a5SPawel Jakub Dawidek /* Update disk status. */ 16002d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(3, "Running event for disk %s.", 16012d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(ep->e_disk)); 16022d1661a5SPawel Jakub Dawidek ep->e_error = g_raid3_update_disk(ep->e_disk, 16032d1661a5SPawel Jakub Dawidek ep->e_state); 16042d1661a5SPawel Jakub Dawidek if (ep->e_error == 0) 16052d1661a5SPawel Jakub Dawidek g_raid3_update_device(sc, 0); 16062d1661a5SPawel Jakub Dawidek } 16072d1661a5SPawel Jakub Dawidek g_topology_unlock(); 16082d1661a5SPawel Jakub Dawidek if ((ep->e_flags & G_RAID3_EVENT_DONTWAIT) != 0) { 16092d1661a5SPawel Jakub Dawidek KASSERT(ep->e_error == 0, 16102d1661a5SPawel Jakub Dawidek ("Error cannot be handled.")); 16112d1661a5SPawel Jakub Dawidek g_raid3_event_free(ep); 16122d1661a5SPawel Jakub Dawidek } else { 16132d1661a5SPawel Jakub Dawidek ep->e_flags |= G_RAID3_EVENT_DONE; 16142d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, 16152d1661a5SPawel Jakub Dawidek ep); 16162d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 16172d1661a5SPawel Jakub Dawidek wakeup(ep); 16182d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_events_mtx); 16192d1661a5SPawel Jakub Dawidek } 16202d1661a5SPawel Jakub Dawidek if ((sc->sc_flags & 16212d1661a5SPawel Jakub Dawidek G_RAID3_DEVICE_FLAG_DESTROY) != 0) { 16222d1661a5SPawel Jakub Dawidek if (g_raid3_try_destroy(sc)) 16232d1661a5SPawel Jakub Dawidek kthread_exit(0); 16242d1661a5SPawel Jakub Dawidek } 16252d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(5, "%s: I'm here 1.", __func__); 16262d1661a5SPawel Jakub Dawidek continue; 16272d1661a5SPawel Jakub Dawidek } 16282d1661a5SPawel Jakub Dawidek /* 16292d1661a5SPawel Jakub Dawidek * Now I/O requests. 16302d1661a5SPawel Jakub Dawidek */ 16312d1661a5SPawel Jakub Dawidek /* Get first request from the queue. */ 16322d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 16332d1661a5SPawel Jakub Dawidek bp = bioq_first(&sc->sc_queue); 16342d1661a5SPawel Jakub Dawidek if (bp == NULL) { 16352d1661a5SPawel Jakub Dawidek if ((sc->sc_flags & 16362d1661a5SPawel Jakub Dawidek G_RAID3_DEVICE_FLAG_DESTROY) != 0) { 16372d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 16382d1661a5SPawel Jakub Dawidek if (g_raid3_try_destroy(sc)) 16392d1661a5SPawel Jakub Dawidek kthread_exit(0); 16402d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 16412d1661a5SPawel Jakub Dawidek } 16422d1661a5SPawel Jakub Dawidek } 16432d1661a5SPawel Jakub Dawidek if (sc->sc_syncdisk != NULL && 16442d1661a5SPawel Jakub Dawidek (bp == NULL || nreqs > g_raid3_reqs_per_sync)) { 16452d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 16462d1661a5SPawel Jakub Dawidek /* 16472d1661a5SPawel Jakub Dawidek * It is time for synchronization... 16482d1661a5SPawel Jakub Dawidek */ 16492d1661a5SPawel Jakub Dawidek nreqs = 0; 16502d1661a5SPawel Jakub Dawidek disk = sc->sc_syncdisk; 16512d1661a5SPawel Jakub Dawidek if (disk->d_sync.ds_offset < 1652c0d68b6eSPawel Jakub Dawidek sc->sc_mediasize / (sc->sc_ndisks - 1) && 16532d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset == 16542d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset_done) { 16552d1661a5SPawel Jakub Dawidek g_raid3_sync_one(sc); 16562d1661a5SPawel Jakub Dawidek } 16572d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(5, "%s: I'm here 2.", __func__); 16582d1661a5SPawel Jakub Dawidek goto sleep; 16592d1661a5SPawel Jakub Dawidek } 16602d1661a5SPawel Jakub Dawidek if (bp == NULL) { 16612d1661a5SPawel Jakub Dawidek MSLEEP(sc, &sc->sc_queue_mtx, PRIBIO | PDROP, "r3:w1", 0); 16622d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(5, "%s: I'm here 3.", __func__); 16632d1661a5SPawel Jakub Dawidek continue; 16642d1661a5SPawel Jakub Dawidek } 16652d1661a5SPawel Jakub Dawidek nreqs++; 16662d1661a5SPawel Jakub Dawidek bioq_remove(&sc->sc_queue, bp); 16672d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 16682d1661a5SPawel Jakub Dawidek 16692d1661a5SPawel Jakub Dawidek if ((bp->bio_cflags & G_RAID3_BIO_CFLAG_REGULAR) != 0) { 16702d1661a5SPawel Jakub Dawidek g_raid3_regular_request(bp); 16712d1661a5SPawel Jakub Dawidek } else if ((bp->bio_cflags & G_RAID3_BIO_CFLAG_SYNC) != 0) { 16722d1661a5SPawel Jakub Dawidek u_int timeout, sps; 16732d1661a5SPawel Jakub Dawidek 16742d1661a5SPawel Jakub Dawidek g_raid3_sync_request(bp); 16752d1661a5SPawel Jakub Dawidek sleep: 16762d1661a5SPawel Jakub Dawidek sps = atomic_load_acq_int(&g_raid3_syncs_per_sec); 16772d1661a5SPawel Jakub Dawidek if (sps == 0) { 16782d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(5, "%s: I'm here 5.", __func__); 16792d1661a5SPawel Jakub Dawidek continue; 16802d1661a5SPawel Jakub Dawidek } 16812d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 16822d1661a5SPawel Jakub Dawidek if (bioq_first(&sc->sc_queue) != NULL) { 16832d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 16842d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(5, "%s: I'm here 4.", __func__); 16852d1661a5SPawel Jakub Dawidek continue; 16862d1661a5SPawel Jakub Dawidek } 16872d1661a5SPawel Jakub Dawidek timeout = hz / sps; 16882d1661a5SPawel Jakub Dawidek if (timeout == 0) 16892d1661a5SPawel Jakub Dawidek timeout = 1; 16902d1661a5SPawel Jakub Dawidek MSLEEP(sc, &sc->sc_queue_mtx, PRIBIO | PDROP, "r3:w2", 16912d1661a5SPawel Jakub Dawidek timeout); 16922d1661a5SPawel Jakub Dawidek } else { 16932d1661a5SPawel Jakub Dawidek if (g_raid3_register_request(bp) != 0) { 16942d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 16952d1661a5SPawel Jakub Dawidek bioq_insert_tail(&sc->sc_queue, bp); 16962d1661a5SPawel Jakub Dawidek MSLEEP(&sc->sc_queue, &sc->sc_queue_mtx, 16972d1661a5SPawel Jakub Dawidek PRIBIO | PDROP, "r3:lowmem", hz / 10); 16982d1661a5SPawel Jakub Dawidek } 16992d1661a5SPawel Jakub Dawidek } 17002d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(5, "%s: I'm here 6.", __func__); 17012d1661a5SPawel Jakub Dawidek } 17022d1661a5SPawel Jakub Dawidek } 17032d1661a5SPawel Jakub Dawidek 17042d1661a5SPawel Jakub Dawidek /* 17052d1661a5SPawel Jakub Dawidek * Open disk's consumer if needed. 17062d1661a5SPawel Jakub Dawidek */ 17072d1661a5SPawel Jakub Dawidek static void 17082d1661a5SPawel Jakub Dawidek g_raid3_update_access(struct g_raid3_disk *disk) 17092d1661a5SPawel Jakub Dawidek { 17102d1661a5SPawel Jakub Dawidek struct g_provider *pp; 17112d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 17122d1661a5SPawel Jakub Dawidek int acr, acw, ace, cpw, error; 17132d1661a5SPawel Jakub Dawidek 17142d1661a5SPawel Jakub Dawidek g_topology_assert(); 17152d1661a5SPawel Jakub Dawidek 17162d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 17172d1661a5SPawel Jakub Dawidek pp = disk->d_softc->sc_provider; 17182d1661a5SPawel Jakub Dawidek if (pp == NULL) { 17192d1661a5SPawel Jakub Dawidek acr = -cp->acr; 17202d1661a5SPawel Jakub Dawidek acw = -cp->acw; 17212d1661a5SPawel Jakub Dawidek ace = -cp->ace; 17222d1661a5SPawel Jakub Dawidek } else { 17232d1661a5SPawel Jakub Dawidek acr = pp->acr - cp->acr; 17242d1661a5SPawel Jakub Dawidek acw = pp->acw - cp->acw; 17252d1661a5SPawel Jakub Dawidek ace = pp->ace - cp->ace; 17262d1661a5SPawel Jakub Dawidek /* Grab an extra "exclusive" bit. */ 17272d1661a5SPawel Jakub Dawidek if (pp->acr > 0 || pp->acw > 0 || pp->ace > 0) 17282d1661a5SPawel Jakub Dawidek ace++; 17292d1661a5SPawel Jakub Dawidek } 17302d1661a5SPawel Jakub Dawidek if (acr == 0 && acw == 0 && ace == 0) 17312d1661a5SPawel Jakub Dawidek return; 17322d1661a5SPawel Jakub Dawidek cpw = cp->acw; 17332d1661a5SPawel Jakub Dawidek error = g_access(cp, acr, acw, ace); 17342d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Access %s r%dw%de%d = %d", cp->provider->name, acr, 17352d1661a5SPawel Jakub Dawidek acw, ace, error); 17362d1661a5SPawel Jakub Dawidek if (error != 0) { 17372d1661a5SPawel Jakub Dawidek disk->d_softc->sc_bump_syncid = G_RAID3_BUMP_ON_FIRST_WRITE; 17382d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, G_RAID3_DISK_STATE_DISCONNECTED, 17392d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 17402d1661a5SPawel Jakub Dawidek return; 17412d1661a5SPawel Jakub Dawidek } 17422d1661a5SPawel Jakub Dawidek if (cpw == 0 && cp->acw > 0) { 17432d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Disk %s (device %s) marked as dirty.", 17442d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), disk->d_softc->sc_name); 17452d1661a5SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_DIRTY; 17462d1661a5SPawel Jakub Dawidek } else if (cpw > 0 && cp->acw == 0) { 17472d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Disk %s (device %s) marked as clean.", 17482d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), disk->d_softc->sc_name); 17492d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 17502d1661a5SPawel Jakub Dawidek } 17512d1661a5SPawel Jakub Dawidek } 17522d1661a5SPawel Jakub Dawidek 17532d1661a5SPawel Jakub Dawidek static void 17542d1661a5SPawel Jakub Dawidek g_raid3_sync_start(struct g_raid3_softc *sc) 17552d1661a5SPawel Jakub Dawidek { 17562d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 17572d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 17582d1661a5SPawel Jakub Dawidek int error; 17592d1661a5SPawel Jakub Dawidek u_int n; 17602d1661a5SPawel Jakub Dawidek 17612d1661a5SPawel Jakub Dawidek g_topology_assert(); 17622d1661a5SPawel Jakub Dawidek 17632d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED, 17642d1661a5SPawel Jakub Dawidek ("Device not in DEGRADED state (%s, %u).", sc->sc_name, 17652d1661a5SPawel Jakub Dawidek sc->sc_state)); 17662d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_syncdisk == NULL, ("Syncdisk is not NULL (%s, %u).", 17672d1661a5SPawel Jakub Dawidek sc->sc_name, sc->sc_state)); 17682d1661a5SPawel Jakub Dawidek disk = NULL; 17692d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 17702d1661a5SPawel Jakub Dawidek if (sc->sc_disks[n].d_state != G_RAID3_DISK_STATE_SYNCHRONIZING) 17712d1661a5SPawel Jakub Dawidek continue; 17722d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 17732d1661a5SPawel Jakub Dawidek break; 17742d1661a5SPawel Jakub Dawidek } 17752d1661a5SPawel Jakub Dawidek if (disk == NULL) 17762d1661a5SPawel Jakub Dawidek return; 17772d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 17782d1661a5SPawel Jakub Dawidek KASSERT(cp->acr == 0 && cp->acw == 0 && cp->ace == 0, 17792d1661a5SPawel Jakub Dawidek ("Consumer %s already opened.", cp->provider->name)); 17802d1661a5SPawel Jakub Dawidek 17812d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: rebuilding provider %s.", sc->sc_name, 17822d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk)); 17832d1661a5SPawel Jakub Dawidek error = g_access(cp, 0, 1, 1); 17842d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Access %s r%dw%de%d = %d", cp->provider->name, 0, 1, 17852d1661a5SPawel Jakub Dawidek 1, error); 17862d1661a5SPawel Jakub Dawidek if (error != 0) { 17872d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, G_RAID3_DISK_STATE_DISCONNECTED, 17882d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 17892d1661a5SPawel Jakub Dawidek return; 17902d1661a5SPawel Jakub Dawidek } 17912d1661a5SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_DIRTY; 17922d1661a5SPawel Jakub Dawidek KASSERT(disk->d_sync.ds_consumer == NULL, 17932d1661a5SPawel Jakub Dawidek ("Sync consumer already exists (device=%s, disk=%s).", 17942d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk))); 17952d1661a5SPawel Jakub Dawidek disk->d_sync.ds_consumer = g_new_consumer(sc->sc_sync.ds_geom); 17962d1661a5SPawel Jakub Dawidek disk->d_sync.ds_consumer->private = disk; 17972d1661a5SPawel Jakub Dawidek error = g_attach(disk->d_sync.ds_consumer, disk->d_softc->sc_provider); 17982d1661a5SPawel Jakub Dawidek KASSERT(error == 0, ("Cannot attach to %s (error=%d).", 17992d1661a5SPawel Jakub Dawidek disk->d_softc->sc_name, error)); 18002d1661a5SPawel Jakub Dawidek error = g_access(disk->d_sync.ds_consumer, 1, 0, 0); 18012d1661a5SPawel Jakub Dawidek KASSERT(error == 0, ("Cannot open %s (error=%d).", 18022d1661a5SPawel Jakub Dawidek disk->d_softc->sc_name, error)); 18032d1661a5SPawel Jakub Dawidek disk->d_sync.ds_data = malloc(G_RAID3_MAX_IO_SIZE, M_RAID3, M_WAITOK); 18042d1661a5SPawel Jakub Dawidek sc->sc_syncdisk = disk; 18052d1661a5SPawel Jakub Dawidek } 18062d1661a5SPawel Jakub Dawidek 18072d1661a5SPawel Jakub Dawidek /* 18082d1661a5SPawel Jakub Dawidek * Stop synchronization process. 18092d1661a5SPawel Jakub Dawidek * type: 0 - synchronization finished 18102d1661a5SPawel Jakub Dawidek * 1 - synchronization stopped 18112d1661a5SPawel Jakub Dawidek */ 18122d1661a5SPawel Jakub Dawidek static void 18132d1661a5SPawel Jakub Dawidek g_raid3_sync_stop(struct g_raid3_softc *sc, int type) 18142d1661a5SPawel Jakub Dawidek { 18152d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 18162d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 18172d1661a5SPawel Jakub Dawidek 18182d1661a5SPawel Jakub Dawidek g_topology_assert(); 18192d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED, 18202d1661a5SPawel Jakub Dawidek ("Device not in DEGRADED state (%s, %u).", sc->sc_name, 18212d1661a5SPawel Jakub Dawidek sc->sc_state)); 18222d1661a5SPawel Jakub Dawidek disk = sc->sc_syncdisk; 18232d1661a5SPawel Jakub Dawidek sc->sc_syncdisk = NULL; 18242d1661a5SPawel Jakub Dawidek KASSERT(disk != NULL, ("No disk was synchronized (%s).", sc->sc_name)); 18252d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING, 18262d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", g_raid3_get_diskname(disk), 18272d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 18282d1661a5SPawel Jakub Dawidek if (disk->d_sync.ds_consumer == NULL) 18292d1661a5SPawel Jakub Dawidek return; 18302d1661a5SPawel Jakub Dawidek 18312d1661a5SPawel Jakub Dawidek if (type == 0) { 18322d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: rebuilding provider %s finished.", 18332d1661a5SPawel Jakub Dawidek disk->d_softc->sc_name, g_raid3_get_diskname(disk)); 18342d1661a5SPawel Jakub Dawidek } else /* if (type == 1) */ { 18352d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: rebuilding provider %s stopped.", 18362d1661a5SPawel Jakub Dawidek disk->d_softc->sc_name, g_raid3_get_diskname(disk)); 18372d1661a5SPawel Jakub Dawidek } 18382d1661a5SPawel Jakub Dawidek cp = disk->d_sync.ds_consumer; 18392d1661a5SPawel Jakub Dawidek g_access(cp, -1, 0, 0); 18402d1661a5SPawel Jakub Dawidek g_raid3_kill_consumer(disk->d_softc, cp); 18412d1661a5SPawel Jakub Dawidek free(disk->d_sync.ds_data, M_RAID3); 18422d1661a5SPawel Jakub Dawidek disk->d_sync.ds_consumer = NULL; 18432d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 18442d1661a5SPawel Jakub Dawidek KASSERT(cp->acr == 0 && cp->acw == 1 && cp->ace == 1, 18452d1661a5SPawel Jakub Dawidek ("Consumer %s not opened.", cp->provider->name)); 18462d1661a5SPawel Jakub Dawidek g_access(cp, 0, -1, -1); 18472d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Access %s r%dw%de%d = %d", cp->provider->name, 0, -1, 18482d1661a5SPawel Jakub Dawidek -1, 0); 18492d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 18502d1661a5SPawel Jakub Dawidek } 18512d1661a5SPawel Jakub Dawidek 18522d1661a5SPawel Jakub Dawidek static void 18532d1661a5SPawel Jakub Dawidek g_raid3_launch_provider(struct g_raid3_softc *sc) 18542d1661a5SPawel Jakub Dawidek { 18552d1661a5SPawel Jakub Dawidek struct g_provider *pp; 18562d1661a5SPawel Jakub Dawidek 18572d1661a5SPawel Jakub Dawidek g_topology_assert(); 18582d1661a5SPawel Jakub Dawidek 18592d1661a5SPawel Jakub Dawidek pp = g_new_providerf(sc->sc_geom, "raid3/%s", sc->sc_name); 18602d1661a5SPawel Jakub Dawidek pp->mediasize = sc->sc_mediasize; 18612d1661a5SPawel Jakub Dawidek pp->sectorsize = sc->sc_sectorsize; 18622d1661a5SPawel Jakub Dawidek sc->sc_provider = pp; 18632d1661a5SPawel Jakub Dawidek g_error_provider(pp, 0); 18642d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: provider %s launched.", sc->sc_name, 18652d1661a5SPawel Jakub Dawidek pp->name); 18662d1661a5SPawel Jakub Dawidek if (sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED) 18672d1661a5SPawel Jakub Dawidek g_raid3_sync_start(sc); 18682d1661a5SPawel Jakub Dawidek } 18692d1661a5SPawel Jakub Dawidek 18702d1661a5SPawel Jakub Dawidek static void 18712d1661a5SPawel Jakub Dawidek g_raid3_destroy_provider(struct g_raid3_softc *sc) 18722d1661a5SPawel Jakub Dawidek { 18732d1661a5SPawel Jakub Dawidek struct bio *bp; 18742d1661a5SPawel Jakub Dawidek 18752d1661a5SPawel Jakub Dawidek g_topology_assert(); 18762d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_provider != NULL, ("NULL provider (device=%s).", 18772d1661a5SPawel Jakub Dawidek sc->sc_name)); 18782d1661a5SPawel Jakub Dawidek 18792d1661a5SPawel Jakub Dawidek g_error_provider(sc->sc_provider, ENXIO); 18802d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 18812d1661a5SPawel Jakub Dawidek while ((bp = bioq_first(&sc->sc_queue)) != NULL) { 18822d1661a5SPawel Jakub Dawidek bioq_remove(&sc->sc_queue, bp); 18832d1661a5SPawel Jakub Dawidek g_io_deliver(bp, ENXIO); 18842d1661a5SPawel Jakub Dawidek } 18852d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 18862d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: provider %s destroyed.", sc->sc_name, 18872d1661a5SPawel Jakub Dawidek sc->sc_provider->name); 18882d1661a5SPawel Jakub Dawidek sc->sc_provider->flags |= G_PF_WITHER; 18892d1661a5SPawel Jakub Dawidek g_orphan_provider(sc->sc_provider, ENXIO); 18902d1661a5SPawel Jakub Dawidek sc->sc_provider = NULL; 18912d1661a5SPawel Jakub Dawidek if (sc->sc_syncdisk != NULL) 18922d1661a5SPawel Jakub Dawidek g_raid3_sync_stop(sc, 1); 18932d1661a5SPawel Jakub Dawidek } 18942d1661a5SPawel Jakub Dawidek 18952d1661a5SPawel Jakub Dawidek static void 18962d1661a5SPawel Jakub Dawidek g_raid3_go(void *arg) 18972d1661a5SPawel Jakub Dawidek { 18982d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 18992d1661a5SPawel Jakub Dawidek 19002d1661a5SPawel Jakub Dawidek sc = arg; 19012d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Force device %s start due to timeout.", sc->sc_name); 19022d1661a5SPawel Jakub Dawidek g_raid3_event_send(sc, 0, 19032d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT | G_RAID3_EVENT_DEVICE); 19042d1661a5SPawel Jakub Dawidek } 19052d1661a5SPawel Jakub Dawidek 19062d1661a5SPawel Jakub Dawidek static u_int 19072d1661a5SPawel Jakub Dawidek g_raid3_determine_state(struct g_raid3_disk *disk) 19082d1661a5SPawel Jakub Dawidek { 19092d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 19102d1661a5SPawel Jakub Dawidek u_int state; 19112d1661a5SPawel Jakub Dawidek 19122d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 19132d1661a5SPawel Jakub Dawidek if (sc->sc_syncid == disk->d_sync.ds_syncid) { 19142d1661a5SPawel Jakub Dawidek if ((disk->d_flags & 19152d1661a5SPawel Jakub Dawidek G_RAID3_DISK_FLAG_SYNCHRONIZING) == 0) { 19162d1661a5SPawel Jakub Dawidek /* Disk does not need synchronization. */ 19172d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_ACTIVE; 19182d1661a5SPawel Jakub Dawidek } else { 19192d1661a5SPawel Jakub Dawidek if ((sc->sc_flags & 19202d1661a5SPawel Jakub Dawidek G_RAID3_DEVICE_FLAG_NOAUTOSYNC) == 0 || 19212d1661a5SPawel Jakub Dawidek (disk->d_flags & 19222d1661a5SPawel Jakub Dawidek G_RAID3_DISK_FLAG_FORCE_SYNC) != 0) { 19232d1661a5SPawel Jakub Dawidek /* 19242d1661a5SPawel Jakub Dawidek * We can start synchronization from 19252d1661a5SPawel Jakub Dawidek * the stored offset. 19262d1661a5SPawel Jakub Dawidek */ 19272d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_SYNCHRONIZING; 19282d1661a5SPawel Jakub Dawidek } else { 19292d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_STALE; 19302d1661a5SPawel Jakub Dawidek } 19312d1661a5SPawel Jakub Dawidek } 19322d1661a5SPawel Jakub Dawidek } else if (disk->d_sync.ds_syncid < sc->sc_syncid) { 19332d1661a5SPawel Jakub Dawidek /* 19342d1661a5SPawel Jakub Dawidek * Reset all synchronization data for this disk, 19352d1661a5SPawel Jakub Dawidek * because if it even was synchronized, it was 19362d1661a5SPawel Jakub Dawidek * synchronized to disks with different syncid. 19372d1661a5SPawel Jakub Dawidek */ 19382d1661a5SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_SYNCHRONIZING; 19392d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset = 0; 19402d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset_done = 0; 19412d1661a5SPawel Jakub Dawidek disk->d_sync.ds_syncid = sc->sc_syncid; 19422d1661a5SPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_NOAUTOSYNC) == 0 || 19432d1661a5SPawel Jakub Dawidek (disk->d_flags & G_RAID3_DISK_FLAG_FORCE_SYNC) != 0) { 19442d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_SYNCHRONIZING; 19452d1661a5SPawel Jakub Dawidek } else { 19462d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_STALE; 19472d1661a5SPawel Jakub Dawidek } 19482d1661a5SPawel Jakub Dawidek } else /* if (sc->sc_syncid < disk->d_sync.ds_syncid) */ { 19492d1661a5SPawel Jakub Dawidek /* 19502d1661a5SPawel Jakub Dawidek * Not good, NOT GOOD! 19512d1661a5SPawel Jakub Dawidek * It means that device was started on stale disks 19522d1661a5SPawel Jakub Dawidek * and more fresh disk just arrive. 19532d1661a5SPawel Jakub Dawidek * If there were writes, device is fucked up, sorry. 19542d1661a5SPawel Jakub Dawidek * I think the best choice here is don't touch 19552d1661a5SPawel Jakub Dawidek * this disk and inform the user laudly. 19562d1661a5SPawel Jakub Dawidek */ 19572d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s was started before the freshest " 19582d1661a5SPawel Jakub Dawidek "disk (%s) arrives!! It will not be connected to the " 19592d1661a5SPawel Jakub Dawidek "running device.", sc->sc_name, 19602d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk)); 19612d1661a5SPawel Jakub Dawidek g_raid3_destroy_disk(disk); 19622d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_NONE; 19632d1661a5SPawel Jakub Dawidek /* Return immediately, because disk was destroyed. */ 19642d1661a5SPawel Jakub Dawidek return (state); 19652d1661a5SPawel Jakub Dawidek } 19662d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(3, "State for %s disk: %s.", 19672d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), g_raid3_disk_state2str(state)); 19682d1661a5SPawel Jakub Dawidek return (state); 19692d1661a5SPawel Jakub Dawidek } 19702d1661a5SPawel Jakub Dawidek 19712d1661a5SPawel Jakub Dawidek /* 19722d1661a5SPawel Jakub Dawidek * Update device state. 19732d1661a5SPawel Jakub Dawidek */ 19742d1661a5SPawel Jakub Dawidek static void 19752d1661a5SPawel Jakub Dawidek g_raid3_update_device(struct g_raid3_softc *sc, boolean_t force) 19762d1661a5SPawel Jakub Dawidek { 19772d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 19782d1661a5SPawel Jakub Dawidek u_int state; 19792d1661a5SPawel Jakub Dawidek 19802d1661a5SPawel Jakub Dawidek g_topology_assert(); 19812d1661a5SPawel Jakub Dawidek 19822d1661a5SPawel Jakub Dawidek switch (sc->sc_state) { 19832d1661a5SPawel Jakub Dawidek case G_RAID3_DEVICE_STATE_STARTING: 19842d1661a5SPawel Jakub Dawidek { 19852d1661a5SPawel Jakub Dawidek u_int n, ndirty, ndisks, syncid; 19862d1661a5SPawel Jakub Dawidek 19872d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_provider == NULL, 19882d1661a5SPawel Jakub Dawidek ("Non-NULL provider in STARTING state (%s).", sc->sc_name)); 19892d1661a5SPawel Jakub Dawidek /* 19902d1661a5SPawel Jakub Dawidek * Are we ready? We are, if all disks are connected or 19912d1661a5SPawel Jakub Dawidek * one disk is missing and 'force' is true. 19922d1661a5SPawel Jakub Dawidek */ 19932d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, -1) + force == sc->sc_ndisks) { 19942d1661a5SPawel Jakub Dawidek if (!force) 19952d1661a5SPawel Jakub Dawidek callout_drain(&sc->sc_callout); 19962d1661a5SPawel Jakub Dawidek } else { 19972d1661a5SPawel Jakub Dawidek if (force) { 19982d1661a5SPawel Jakub Dawidek /* 19992d1661a5SPawel Jakub Dawidek * Timeout expired, so destroy device. 20002d1661a5SPawel Jakub Dawidek */ 20012d1661a5SPawel Jakub Dawidek sc->sc_flags |= G_RAID3_DEVICE_FLAG_DESTROY; 20022d1661a5SPawel Jakub Dawidek } 20032d1661a5SPawel Jakub Dawidek return; 20042d1661a5SPawel Jakub Dawidek } 20052d1661a5SPawel Jakub Dawidek 20062d1661a5SPawel Jakub Dawidek /* 20072d1661a5SPawel Jakub Dawidek * There must be at least 'sc->sc_ndisks - 1' components 20082d1661a5SPawel Jakub Dawidek * with the same syncid and without SYNCHRONIZING flag. 20092d1661a5SPawel Jakub Dawidek */ 20102d1661a5SPawel Jakub Dawidek 20112d1661a5SPawel Jakub Dawidek /* 20122d1661a5SPawel Jakub Dawidek * Find the biggest syncid, number of valid components and 20132d1661a5SPawel Jakub Dawidek * number of dirty components. 20142d1661a5SPawel Jakub Dawidek */ 20152d1661a5SPawel Jakub Dawidek ndirty = ndisks = syncid = 0; 20162d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 20172d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 20182d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NODISK) 20192d1661a5SPawel Jakub Dawidek continue; 20202d1661a5SPawel Jakub Dawidek if ((disk->d_flags & G_RAID3_DISK_FLAG_DIRTY) != 0) 20212d1661a5SPawel Jakub Dawidek ndirty++; 20222d1661a5SPawel Jakub Dawidek if (disk->d_sync.ds_syncid > syncid) { 20232d1661a5SPawel Jakub Dawidek syncid = disk->d_sync.ds_syncid; 20242d1661a5SPawel Jakub Dawidek ndisks = 0; 20252d1661a5SPawel Jakub Dawidek } else if (disk->d_sync.ds_syncid < syncid) { 20262d1661a5SPawel Jakub Dawidek continue; 20272d1661a5SPawel Jakub Dawidek } 20282d1661a5SPawel Jakub Dawidek if ((disk->d_flags & 20292d1661a5SPawel Jakub Dawidek G_RAID3_DISK_FLAG_SYNCHRONIZING) != 0) { 20302d1661a5SPawel Jakub Dawidek continue; 20312d1661a5SPawel Jakub Dawidek } 20322d1661a5SPawel Jakub Dawidek ndisks++; 20332d1661a5SPawel Jakub Dawidek } 20342d1661a5SPawel Jakub Dawidek /* 20352d1661a5SPawel Jakub Dawidek * Do we have enough valid components? 20362d1661a5SPawel Jakub Dawidek */ 20372d1661a5SPawel Jakub Dawidek if (ndisks + 1 < sc->sc_ndisks) { 20382d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, 20392d1661a5SPawel Jakub Dawidek "Device %s is broken, too few valid components.", 20402d1661a5SPawel Jakub Dawidek sc->sc_name); 20412d1661a5SPawel Jakub Dawidek sc->sc_flags |= G_RAID3_DEVICE_FLAG_DESTROY; 20422d1661a5SPawel Jakub Dawidek return; 20432d1661a5SPawel Jakub Dawidek } 20442d1661a5SPawel Jakub Dawidek /* 20452d1661a5SPawel Jakub Dawidek * If there is one DIRTY component and all disks are present, 20462d1661a5SPawel Jakub Dawidek * mark it for synchronization. If there is more than one DIRTY 20472d1661a5SPawel Jakub Dawidek * component, mark parity component for synchronization. 20482d1661a5SPawel Jakub Dawidek */ 20492d1661a5SPawel Jakub Dawidek if (ndisks == sc->sc_ndisks && ndirty == 1) { 20502d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 20512d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 20522d1661a5SPawel Jakub Dawidek if ((disk->d_flags & 20532d1661a5SPawel Jakub Dawidek G_RAID3_DISK_FLAG_DIRTY) == 0) { 20542d1661a5SPawel Jakub Dawidek continue; 20552d1661a5SPawel Jakub Dawidek } 20562d1661a5SPawel Jakub Dawidek disk->d_flags |= 20572d1661a5SPawel Jakub Dawidek G_RAID3_DISK_FLAG_SYNCHRONIZING; 20582d1661a5SPawel Jakub Dawidek } 20592d1661a5SPawel Jakub Dawidek } else if (ndisks == sc->sc_ndisks && ndirty > 1) { 20602d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[sc->sc_ndisks - 1]; 20612d1661a5SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_SYNCHRONIZING; 20622d1661a5SPawel Jakub Dawidek } 20632d1661a5SPawel Jakub Dawidek 20642d1661a5SPawel Jakub Dawidek sc->sc_syncid = syncid; 20652d1661a5SPawel Jakub Dawidek if (force) { 20662d1661a5SPawel Jakub Dawidek /* Remember to bump syncid on first write. */ 20672d1661a5SPawel Jakub Dawidek sc->sc_bump_syncid = G_RAID3_BUMP_ON_FIRST_WRITE; 20682d1661a5SPawel Jakub Dawidek } 20692d1661a5SPawel Jakub Dawidek if (ndisks == sc->sc_ndisks) 20702d1661a5SPawel Jakub Dawidek state = G_RAID3_DEVICE_STATE_COMPLETE; 20712d1661a5SPawel Jakub Dawidek else /* if (ndisks == sc->sc_ndisks - 1) */ 20722d1661a5SPawel Jakub Dawidek state = G_RAID3_DEVICE_STATE_DEGRADED; 20732d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Device %s state changed from %s to %s.", 20742d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_device_state2str(sc->sc_state), 20752d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(state)); 20762d1661a5SPawel Jakub Dawidek sc->sc_state = state; 20772d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 20782d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 20792d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NODISK) 20802d1661a5SPawel Jakub Dawidek continue; 20812d1661a5SPawel Jakub Dawidek state = g_raid3_determine_state(disk); 20822d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, state, G_RAID3_EVENT_DONTWAIT); 20832d1661a5SPawel Jakub Dawidek if (state == G_RAID3_DISK_STATE_STALE) { 20842d1661a5SPawel Jakub Dawidek sc->sc_bump_syncid = 20852d1661a5SPawel Jakub Dawidek G_RAID3_BUMP_ON_FIRST_WRITE; 20862d1661a5SPawel Jakub Dawidek } 20872d1661a5SPawel Jakub Dawidek } 20882d1661a5SPawel Jakub Dawidek break; 20892d1661a5SPawel Jakub Dawidek } 20902d1661a5SPawel Jakub Dawidek case G_RAID3_DEVICE_STATE_DEGRADED: 20912d1661a5SPawel Jakub Dawidek /* 20922d1661a5SPawel Jakub Dawidek * Bump syncid here, if we need to do it immediately. 20932d1661a5SPawel Jakub Dawidek */ 20942d1661a5SPawel Jakub Dawidek if (sc->sc_bump_syncid == G_RAID3_BUMP_IMMEDIATELY) { 20952d1661a5SPawel Jakub Dawidek sc->sc_bump_syncid = 0; 20962d1661a5SPawel Jakub Dawidek g_raid3_bump_syncid(sc); 20972d1661a5SPawel Jakub Dawidek } 20982d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_NEW) > 0) 20992d1661a5SPawel Jakub Dawidek return; 21002d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) < 21012d1661a5SPawel Jakub Dawidek sc->sc_ndisks - 1) { 21022d1661a5SPawel Jakub Dawidek if (sc->sc_provider != NULL) 21032d1661a5SPawel Jakub Dawidek g_raid3_destroy_provider(sc); 21042d1661a5SPawel Jakub Dawidek sc->sc_flags |= G_RAID3_DEVICE_FLAG_DESTROY; 21052d1661a5SPawel Jakub Dawidek return; 21062d1661a5SPawel Jakub Dawidek } 21072d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) == 21082d1661a5SPawel Jakub Dawidek sc->sc_ndisks) { 21092d1661a5SPawel Jakub Dawidek state = G_RAID3_DEVICE_STATE_COMPLETE; 21102d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 21112d1661a5SPawel Jakub Dawidek "Device %s state changed from %s to %s.", 21122d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_device_state2str(sc->sc_state), 21132d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(state)); 21142d1661a5SPawel Jakub Dawidek sc->sc_state = state; 21152d1661a5SPawel Jakub Dawidek } 21162d1661a5SPawel Jakub Dawidek if (sc->sc_provider == NULL) 21172d1661a5SPawel Jakub Dawidek g_raid3_launch_provider(sc); 21182d1661a5SPawel Jakub Dawidek break; 21192d1661a5SPawel Jakub Dawidek case G_RAID3_DEVICE_STATE_COMPLETE: 21202d1661a5SPawel Jakub Dawidek /* 21212d1661a5SPawel Jakub Dawidek * Bump syncid here, if we need to do it immediately. 21222d1661a5SPawel Jakub Dawidek */ 21232d1661a5SPawel Jakub Dawidek if (sc->sc_bump_syncid == G_RAID3_BUMP_IMMEDIATELY) { 21242d1661a5SPawel Jakub Dawidek sc->sc_bump_syncid = 0; 21252d1661a5SPawel Jakub Dawidek g_raid3_bump_syncid(sc); 21262d1661a5SPawel Jakub Dawidek } 21272d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_NEW) > 0) 21282d1661a5SPawel Jakub Dawidek return; 21292d1661a5SPawel Jakub Dawidek KASSERT(g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) >= 21302d1661a5SPawel Jakub Dawidek sc->sc_ndisks - 1, 21312d1661a5SPawel Jakub Dawidek ("Too few ACTIVE components in COMPLETE state (device %s).", 21322d1661a5SPawel Jakub Dawidek sc->sc_name)); 21332d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) == 21342d1661a5SPawel Jakub Dawidek sc->sc_ndisks - 1) { 21352d1661a5SPawel Jakub Dawidek state = G_RAID3_DEVICE_STATE_DEGRADED; 21362d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 21372d1661a5SPawel Jakub Dawidek "Device %s state changed from %s to %s.", 21382d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_device_state2str(sc->sc_state), 21392d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(state)); 21402d1661a5SPawel Jakub Dawidek sc->sc_state = state; 21412d1661a5SPawel Jakub Dawidek } 21422d1661a5SPawel Jakub Dawidek if (sc->sc_provider == NULL) 21432d1661a5SPawel Jakub Dawidek g_raid3_launch_provider(sc); 21442d1661a5SPawel Jakub Dawidek break; 21452d1661a5SPawel Jakub Dawidek default: 21462d1661a5SPawel Jakub Dawidek KASSERT(1 == 0, ("Wrong device state (%s, %s).", sc->sc_name, 21472d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state))); 21482d1661a5SPawel Jakub Dawidek break; 21492d1661a5SPawel Jakub Dawidek } 21502d1661a5SPawel Jakub Dawidek } 21512d1661a5SPawel Jakub Dawidek 21522d1661a5SPawel Jakub Dawidek /* 21532d1661a5SPawel Jakub Dawidek * Update disk state and device state if needed. 21542d1661a5SPawel Jakub Dawidek */ 21552d1661a5SPawel Jakub Dawidek #define DISK_STATE_CHANGED() G_RAID3_DEBUG(1, \ 21562d1661a5SPawel Jakub Dawidek "Disk %s state changed from %s to %s (device %s).", \ 21572d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), \ 21582d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state), \ 21592d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(state), sc->sc_name) 21602d1661a5SPawel Jakub Dawidek static int 21612d1661a5SPawel Jakub Dawidek g_raid3_update_disk(struct g_raid3_disk *disk, u_int state) 21622d1661a5SPawel Jakub Dawidek { 21632d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 21642d1661a5SPawel Jakub Dawidek 21652d1661a5SPawel Jakub Dawidek g_topology_assert(); 21662d1661a5SPawel Jakub Dawidek 21672d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 21682d1661a5SPawel Jakub Dawidek again: 21692d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(3, "Changing disk %s state from %s to %s.", 21702d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), g_raid3_disk_state2str(disk->d_state), 21712d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(state)); 21722d1661a5SPawel Jakub Dawidek switch (state) { 21732d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_NEW: 21742d1661a5SPawel Jakub Dawidek /* 21752d1661a5SPawel Jakub Dawidek * Possible scenarios: 21762d1661a5SPawel Jakub Dawidek * 1. New disk arrive. 21772d1661a5SPawel Jakub Dawidek */ 21782d1661a5SPawel Jakub Dawidek /* Previous state should be NONE. */ 21792d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_NONE, 21802d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", g_raid3_get_diskname(disk), 21812d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 21822d1661a5SPawel Jakub Dawidek DISK_STATE_CHANGED(); 21832d1661a5SPawel Jakub Dawidek 21842d1661a5SPawel Jakub Dawidek disk->d_state = state; 21852d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: provider %s detected.", 21862d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk)); 21872d1661a5SPawel Jakub Dawidek if (sc->sc_state == G_RAID3_DEVICE_STATE_STARTING) 21882d1661a5SPawel Jakub Dawidek break; 21892d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 21902d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE, 21912d1661a5SPawel Jakub Dawidek ("Wrong device state (%s, %s, %s, %s).", sc->sc_name, 21922d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 21932d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 21942d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 21952d1661a5SPawel Jakub Dawidek state = g_raid3_determine_state(disk); 21962d1661a5SPawel Jakub Dawidek if (state != G_RAID3_DISK_STATE_NONE) 21972d1661a5SPawel Jakub Dawidek goto again; 21982d1661a5SPawel Jakub Dawidek break; 21992d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_ACTIVE: 22002d1661a5SPawel Jakub Dawidek /* 22012d1661a5SPawel Jakub Dawidek * Possible scenarios: 22022d1661a5SPawel Jakub Dawidek * 1. New disk does not need synchronization. 22032d1661a5SPawel Jakub Dawidek * 2. Synchronization process finished successfully. 22042d1661a5SPawel Jakub Dawidek */ 22052d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 22062d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE, 22072d1661a5SPawel Jakub Dawidek ("Wrong device state (%s, %s, %s, %s).", sc->sc_name, 22082d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 22092d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 22102d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 22112d1661a5SPawel Jakub Dawidek /* Previous state should be NEW or SYNCHRONIZING. */ 22122d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_NEW || 22132d1661a5SPawel Jakub Dawidek disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING, 22142d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", g_raid3_get_diskname(disk), 22152d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 22162d1661a5SPawel Jakub Dawidek DISK_STATE_CHANGED(); 22172d1661a5SPawel Jakub Dawidek 22182d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NEW) 22192d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 22202d1661a5SPawel Jakub Dawidek else if (disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING) { 22212d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_SYNCHRONIZING; 22222d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_FORCE_SYNC; 22232d1661a5SPawel Jakub Dawidek g_raid3_sync_stop(sc, 0); 22242d1661a5SPawel Jakub Dawidek } 22252d1661a5SPawel Jakub Dawidek disk->d_state = state; 22262d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset = 0; 22272d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset_done = 0; 22282d1661a5SPawel Jakub Dawidek g_raid3_update_access(disk); 22292d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(disk); 22302d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: provider %s activated.", 22312d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk)); 22322d1661a5SPawel Jakub Dawidek break; 22332d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_STALE: 22342d1661a5SPawel Jakub Dawidek /* 22352d1661a5SPawel Jakub Dawidek * Possible scenarios: 22362d1661a5SPawel Jakub Dawidek * 1. Stale disk was connected. 22372d1661a5SPawel Jakub Dawidek */ 22382d1661a5SPawel Jakub Dawidek /* Previous state should be NEW. */ 22392d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_NEW, 22402d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", g_raid3_get_diskname(disk), 22412d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 22422d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 22432d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE, 22442d1661a5SPawel Jakub Dawidek ("Wrong device state (%s, %s, %s, %s).", sc->sc_name, 22452d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 22462d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 22472d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 22482d1661a5SPawel Jakub Dawidek /* 22492d1661a5SPawel Jakub Dawidek * STALE state is only possible if device is marked 22502d1661a5SPawel Jakub Dawidek * NOAUTOSYNC. 22512d1661a5SPawel Jakub Dawidek */ 22522d1661a5SPawel Jakub Dawidek KASSERT((sc->sc_flags & G_RAID3_DEVICE_FLAG_NOAUTOSYNC) != 0, 22532d1661a5SPawel Jakub Dawidek ("Wrong device state (%s, %s, %s, %s).", sc->sc_name, 22542d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 22552d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 22562d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 22572d1661a5SPawel Jakub Dawidek DISK_STATE_CHANGED(); 22582d1661a5SPawel Jakub Dawidek 22592d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 22602d1661a5SPawel Jakub Dawidek disk->d_state = state; 22612d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(disk); 22622d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: provider %s is stale.", 22632d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk)); 22642d1661a5SPawel Jakub Dawidek break; 22652d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_SYNCHRONIZING: 22662d1661a5SPawel Jakub Dawidek /* 22672d1661a5SPawel Jakub Dawidek * Possible scenarios: 22682d1661a5SPawel Jakub Dawidek * 1. Disk which needs synchronization was connected. 22692d1661a5SPawel Jakub Dawidek */ 22702d1661a5SPawel Jakub Dawidek /* Previous state should be NEW. */ 22712d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_NEW, 22722d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", g_raid3_get_diskname(disk), 22732d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 22742d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 22752d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE, 22762d1661a5SPawel Jakub Dawidek ("Wrong device state (%s, %s, %s, %s).", sc->sc_name, 22772d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 22782d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 22792d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 22802d1661a5SPawel Jakub Dawidek DISK_STATE_CHANGED(); 22812d1661a5SPawel Jakub Dawidek 22822d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NEW) 22832d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 22842d1661a5SPawel Jakub Dawidek disk->d_state = state; 22852d1661a5SPawel Jakub Dawidek if (sc->sc_provider != NULL) { 22862d1661a5SPawel Jakub Dawidek g_raid3_sync_start(sc); 22872d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(disk); 22882d1661a5SPawel Jakub Dawidek } 22892d1661a5SPawel Jakub Dawidek break; 22902d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_DISCONNECTED: 22912d1661a5SPawel Jakub Dawidek /* 22922d1661a5SPawel Jakub Dawidek * Possible scenarios: 22932d1661a5SPawel Jakub Dawidek * 1. Device wasn't running yet, but disk disappear. 22942d1661a5SPawel Jakub Dawidek * 2. Disk was active and disapppear. 22952d1661a5SPawel Jakub Dawidek * 3. Disk disappear during synchronization process. 22962d1661a5SPawel Jakub Dawidek */ 22972d1661a5SPawel Jakub Dawidek if (sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 22982d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE) { 22992d1661a5SPawel Jakub Dawidek /* 23002d1661a5SPawel Jakub Dawidek * Previous state should be ACTIVE, STALE or 23012d1661a5SPawel Jakub Dawidek * SYNCHRONIZING. 23022d1661a5SPawel Jakub Dawidek */ 23032d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_ACTIVE || 23042d1661a5SPawel Jakub Dawidek disk->d_state == G_RAID3_DISK_STATE_STALE || 23052d1661a5SPawel Jakub Dawidek disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING, 23062d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", 23072d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 23082d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 23092d1661a5SPawel Jakub Dawidek } else if (sc->sc_state == G_RAID3_DEVICE_STATE_STARTING) { 23102d1661a5SPawel Jakub Dawidek /* Previous state should be NEW. */ 23112d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_NEW, 23122d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", 23132d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 23142d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 23152d1661a5SPawel Jakub Dawidek /* 23162d1661a5SPawel Jakub Dawidek * Reset bumping syncid if disk disappeared in STARTING 23172d1661a5SPawel Jakub Dawidek * state. 23182d1661a5SPawel Jakub Dawidek */ 23192d1661a5SPawel Jakub Dawidek if (sc->sc_bump_syncid == G_RAID3_BUMP_ON_FIRST_WRITE) 23202d1661a5SPawel Jakub Dawidek sc->sc_bump_syncid = 0; 23212d1661a5SPawel Jakub Dawidek #ifdef INVARIANTS 23222d1661a5SPawel Jakub Dawidek } else { 23232d1661a5SPawel Jakub Dawidek KASSERT(1 == 0, ("Wrong device state (%s, %s, %s, %s).", 23242d1661a5SPawel Jakub Dawidek sc->sc_name, 23252d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 23262d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 23272d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 23282d1661a5SPawel Jakub Dawidek #endif 23292d1661a5SPawel Jakub Dawidek } 23302d1661a5SPawel Jakub Dawidek DISK_STATE_CHANGED(); 23312d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: provider %s disconnected.", 23322d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk)); 23332d1661a5SPawel Jakub Dawidek 23342d1661a5SPawel Jakub Dawidek g_raid3_destroy_disk(disk); 23352d1661a5SPawel Jakub Dawidek break; 23362d1661a5SPawel Jakub Dawidek default: 23372d1661a5SPawel Jakub Dawidek KASSERT(1 == 0, ("Unknown state (%u).", state)); 23382d1661a5SPawel Jakub Dawidek break; 23392d1661a5SPawel Jakub Dawidek } 23402d1661a5SPawel Jakub Dawidek return (0); 23412d1661a5SPawel Jakub Dawidek } 23422d1661a5SPawel Jakub Dawidek #undef DISK_STATE_CHANGED 23432d1661a5SPawel Jakub Dawidek 23442d1661a5SPawel Jakub Dawidek static int 23452d1661a5SPawel Jakub Dawidek g_raid3_read_metadata(struct g_consumer *cp, struct g_raid3_metadata *md) 23462d1661a5SPawel Jakub Dawidek { 23472d1661a5SPawel Jakub Dawidek struct g_provider *pp; 23482d1661a5SPawel Jakub Dawidek u_char *buf; 23492d1661a5SPawel Jakub Dawidek int error; 23502d1661a5SPawel Jakub Dawidek 23512d1661a5SPawel Jakub Dawidek g_topology_assert(); 23522d1661a5SPawel Jakub Dawidek 23532d1661a5SPawel Jakub Dawidek error = g_access(cp, 1, 0, 0); 23542d1661a5SPawel Jakub Dawidek if (error != 0) 23552d1661a5SPawel Jakub Dawidek return (error); 23562d1661a5SPawel Jakub Dawidek pp = cp->provider; 23572d1661a5SPawel Jakub Dawidek g_topology_unlock(); 23582d1661a5SPawel Jakub Dawidek /* Metadata are stored on last sector. */ 23592d1661a5SPawel Jakub Dawidek buf = g_read_data(cp, pp->mediasize - pp->sectorsize, pp->sectorsize, 23602d1661a5SPawel Jakub Dawidek &error); 23612d1661a5SPawel Jakub Dawidek g_topology_lock(); 23622d1661a5SPawel Jakub Dawidek if (buf == NULL) { 23632d1661a5SPawel Jakub Dawidek g_access(cp, -1, 0, 0); 23642d1661a5SPawel Jakub Dawidek return (error); 23652d1661a5SPawel Jakub Dawidek } 23662d1661a5SPawel Jakub Dawidek if (error != 0) { 23672d1661a5SPawel Jakub Dawidek g_access(cp, -1, 0, 0); 23682d1661a5SPawel Jakub Dawidek g_free(buf); 23692d1661a5SPawel Jakub Dawidek return (error); 23702d1661a5SPawel Jakub Dawidek } 23712d1661a5SPawel Jakub Dawidek error = g_access(cp, -1, 0, 0); 23722d1661a5SPawel Jakub Dawidek KASSERT(error == 0, ("Cannot decrease access count for %s.", pp->name)); 23732d1661a5SPawel Jakub Dawidek 23742d1661a5SPawel Jakub Dawidek /* Decode metadata. */ 23752d1661a5SPawel Jakub Dawidek error = raid3_metadata_decode(buf, md); 23762d1661a5SPawel Jakub Dawidek g_free(buf); 23772d1661a5SPawel Jakub Dawidek if (strcmp(md->md_magic, G_RAID3_MAGIC) != 0) 23782d1661a5SPawel Jakub Dawidek return (EINVAL); 23792d1661a5SPawel Jakub Dawidek if (error != 0) { 23802d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "MD5 metadata hash mismatch for provider %s.", 23812d1661a5SPawel Jakub Dawidek cp->provider->name); 23822d1661a5SPawel Jakub Dawidek return (error); 23832d1661a5SPawel Jakub Dawidek } 23842d1661a5SPawel Jakub Dawidek 23852d1661a5SPawel Jakub Dawidek return (0); 23862d1661a5SPawel Jakub Dawidek } 23872d1661a5SPawel Jakub Dawidek 23882d1661a5SPawel Jakub Dawidek static int 23892d1661a5SPawel Jakub Dawidek g_raid3_check_metadata(struct g_raid3_softc *sc, struct g_provider *pp, 23902d1661a5SPawel Jakub Dawidek struct g_raid3_metadata *md) 23912d1661a5SPawel Jakub Dawidek { 23922d1661a5SPawel Jakub Dawidek 23932d1661a5SPawel Jakub Dawidek if (md->md_no >= sc->sc_ndisks) { 23942d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Invalid disk %s number (no=%u), skipping.", 23952d1661a5SPawel Jakub Dawidek pp->name, md->md_no); 23962d1661a5SPawel Jakub Dawidek return (EINVAL); 23972d1661a5SPawel Jakub Dawidek } 23982d1661a5SPawel Jakub Dawidek if (sc->sc_disks[md->md_no].d_state != G_RAID3_DISK_STATE_NODISK) { 23992d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Disk %s (no=%u) already exists, skipping.", 24002d1661a5SPawel Jakub Dawidek pp->name, md->md_no); 24012d1661a5SPawel Jakub Dawidek return (EEXIST); 24022d1661a5SPawel Jakub Dawidek } 24032d1661a5SPawel Jakub Dawidek if (md->md_all != sc->sc_ndisks) { 24042d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 24052d1661a5SPawel Jakub Dawidek "Invalid '%s' field on disk %s (device %s), skipping.", 24062d1661a5SPawel Jakub Dawidek "md_all", pp->name, sc->sc_name); 24072d1661a5SPawel Jakub Dawidek return (EINVAL); 24082d1661a5SPawel Jakub Dawidek } 24092d1661a5SPawel Jakub Dawidek if (md->md_mediasize != sc->sc_mediasize) { 24102d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 24112d1661a5SPawel Jakub Dawidek "Invalid '%s' field on disk %s (device %s), skipping.", 24122d1661a5SPawel Jakub Dawidek "md_mediasize", pp->name, sc->sc_name); 24132d1661a5SPawel Jakub Dawidek return (EINVAL); 24142d1661a5SPawel Jakub Dawidek } 24152d1661a5SPawel Jakub Dawidek if ((md->md_mediasize % (sc->sc_ndisks - 1)) != 0) { 24162d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 24172d1661a5SPawel Jakub Dawidek "Invalid '%s' field on disk %s (device %s), skipping.", 24182d1661a5SPawel Jakub Dawidek "md_mediasize", pp->name, sc->sc_name); 24192d1661a5SPawel Jakub Dawidek return (EINVAL); 24202d1661a5SPawel Jakub Dawidek } 24212d1661a5SPawel Jakub Dawidek if ((sc->sc_mediasize / (sc->sc_ndisks - 1)) > pp->mediasize) { 24222d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 24232d1661a5SPawel Jakub Dawidek "Invalid size of disk %s (device %s), skipping.", pp->name, 24242d1661a5SPawel Jakub Dawidek sc->sc_name); 24252d1661a5SPawel Jakub Dawidek return (EINVAL); 24262d1661a5SPawel Jakub Dawidek } 24272d1661a5SPawel Jakub Dawidek if ((md->md_sectorsize / pp->sectorsize) < sc->sc_ndisks - 1) { 24282d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 24292d1661a5SPawel Jakub Dawidek "Invalid '%s' field on disk %s (device %s), skipping.", 24302d1661a5SPawel Jakub Dawidek "md_sectorsize", pp->name, sc->sc_name); 24312d1661a5SPawel Jakub Dawidek return (EINVAL); 24322d1661a5SPawel Jakub Dawidek } 24332d1661a5SPawel Jakub Dawidek if (md->md_sectorsize != sc->sc_sectorsize) { 24342d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 24352d1661a5SPawel Jakub Dawidek "Invalid '%s' field on disk %s (device %s), skipping.", 24362d1661a5SPawel Jakub Dawidek "md_sectorsize", pp->name, sc->sc_name); 24372d1661a5SPawel Jakub Dawidek return (EINVAL); 24382d1661a5SPawel Jakub Dawidek } 24392d1661a5SPawel Jakub Dawidek if ((sc->sc_sectorsize % pp->sectorsize) != 0) { 24402d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 24412d1661a5SPawel Jakub Dawidek "Invalid sector size of disk %s (device %s), skipping.", 24422d1661a5SPawel Jakub Dawidek pp->name, sc->sc_name); 24432d1661a5SPawel Jakub Dawidek return (EINVAL); 24442d1661a5SPawel Jakub Dawidek } 24452d1661a5SPawel Jakub Dawidek if ((md->md_mflags & ~G_RAID3_DEVICE_FLAG_MASK) != 0) { 24462d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 24472d1661a5SPawel Jakub Dawidek "Invalid device flags on disk %s (device %s), skipping.", 24482d1661a5SPawel Jakub Dawidek pp->name, sc->sc_name); 24492d1661a5SPawel Jakub Dawidek return (EINVAL); 24502d1661a5SPawel Jakub Dawidek } 2451dba915cfSPawel Jakub Dawidek if ((md->md_mflags & G_RAID3_DEVICE_FLAG_VERIFY) != 0 && 2452dba915cfSPawel Jakub Dawidek (md->md_mflags & G_RAID3_DEVICE_FLAG_ROUND_ROBIN) != 0) { 2453dba915cfSPawel Jakub Dawidek /* 2454dba915cfSPawel Jakub Dawidek * VERIFY and ROUND-ROBIN options are mutally exclusive. 2455dba915cfSPawel Jakub Dawidek */ 2456dba915cfSPawel Jakub Dawidek G_RAID3_DEBUG(1, "Both VERIFY and ROUND-ROBIN flags exist on " 2457dba915cfSPawel Jakub Dawidek "disk %s (device %s), skipping.", pp->name, sc->sc_name); 2458dba915cfSPawel Jakub Dawidek return (EINVAL); 2459dba915cfSPawel Jakub Dawidek } 24602d1661a5SPawel Jakub Dawidek if ((md->md_dflags & ~G_RAID3_DISK_FLAG_MASK) != 0) { 24612d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 24622d1661a5SPawel Jakub Dawidek "Invalid disk flags on disk %s (device %s), skipping.", 24632d1661a5SPawel Jakub Dawidek pp->name, sc->sc_name); 24642d1661a5SPawel Jakub Dawidek return (EINVAL); 24652d1661a5SPawel Jakub Dawidek } 24662d1661a5SPawel Jakub Dawidek return (0); 24672d1661a5SPawel Jakub Dawidek } 24682d1661a5SPawel Jakub Dawidek 24692d1661a5SPawel Jakub Dawidek static int 24702d1661a5SPawel Jakub Dawidek g_raid3_add_disk(struct g_raid3_softc *sc, struct g_provider *pp, 24712d1661a5SPawel Jakub Dawidek struct g_raid3_metadata *md) 24722d1661a5SPawel Jakub Dawidek { 24732d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 24742d1661a5SPawel Jakub Dawidek int error; 24752d1661a5SPawel Jakub Dawidek 24762d1661a5SPawel Jakub Dawidek g_topology_assert(); 24772d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Adding disk %s.", pp->name); 24782d1661a5SPawel Jakub Dawidek 24792d1661a5SPawel Jakub Dawidek error = g_raid3_check_metadata(sc, pp, md); 24802d1661a5SPawel Jakub Dawidek if (error != 0) 24812d1661a5SPawel Jakub Dawidek return (error); 24822d1661a5SPawel Jakub Dawidek disk = g_raid3_init_disk(sc, pp, md, &error); 24832d1661a5SPawel Jakub Dawidek if (disk == NULL) 24842d1661a5SPawel Jakub Dawidek return (error); 24852d1661a5SPawel Jakub Dawidek error = g_raid3_event_send(disk, G_RAID3_DISK_STATE_NEW, 24862d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_WAIT); 24872d1661a5SPawel Jakub Dawidek return (error); 24882d1661a5SPawel Jakub Dawidek } 24892d1661a5SPawel Jakub Dawidek 24902d1661a5SPawel Jakub Dawidek static int 24912d1661a5SPawel Jakub Dawidek g_raid3_access(struct g_provider *pp, int acr, int acw, int ace) 24922d1661a5SPawel Jakub Dawidek { 24932d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 24942d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 24952d1661a5SPawel Jakub Dawidek int dcr, dcw, dce, err, error; 24962d1661a5SPawel Jakub Dawidek u_int n; 24972d1661a5SPawel Jakub Dawidek 24982d1661a5SPawel Jakub Dawidek g_topology_assert(); 24992d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Access request for %s: r%dw%de%d.", pp->name, acr, 25002d1661a5SPawel Jakub Dawidek acw, ace); 25012d1661a5SPawel Jakub Dawidek 25022d1661a5SPawel Jakub Dawidek dcr = pp->acr + acr; 25032d1661a5SPawel Jakub Dawidek dcw = pp->acw + acw; 25042d1661a5SPawel Jakub Dawidek dce = pp->ace + ace; 25052d1661a5SPawel Jakub Dawidek 25062d1661a5SPawel Jakub Dawidek /* On first open, grab an extra "exclusive" bit */ 25072d1661a5SPawel Jakub Dawidek if (pp->acr == 0 && pp->acw == 0 && pp->ace == 0) 25082d1661a5SPawel Jakub Dawidek ace++; 25092d1661a5SPawel Jakub Dawidek /* ... and let go of it on last close */ 25102d1661a5SPawel Jakub Dawidek if (dcr == 0 && dcw == 0 && dce == 0) 25112d1661a5SPawel Jakub Dawidek ace--; 25122d1661a5SPawel Jakub Dawidek 25132d1661a5SPawel Jakub Dawidek sc = pp->geom->softc; 25142d1661a5SPawel Jakub Dawidek if (sc == NULL || 25152d1661a5SPawel Jakub Dawidek g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) < sc->sc_ndisks - 1) { 25162d1661a5SPawel Jakub Dawidek if (acr <= 0 && acw <= 0 && ace <= 0) 25172d1661a5SPawel Jakub Dawidek return (0); 25182d1661a5SPawel Jakub Dawidek else 25192d1661a5SPawel Jakub Dawidek return (ENXIO); 25202d1661a5SPawel Jakub Dawidek } 25212d1661a5SPawel Jakub Dawidek error = ENXIO; 25222d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 25232d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 25242d1661a5SPawel Jakub Dawidek if (disk->d_state != G_RAID3_DISK_STATE_ACTIVE) 25252d1661a5SPawel Jakub Dawidek continue; 25262d1661a5SPawel Jakub Dawidek err = g_access(disk->d_consumer, acr, acw, ace); 25272d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Access %s r%dw%de%d = %d", 25282d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), acr, acw, ace, err); 25292d1661a5SPawel Jakub Dawidek if (err == 0) { 25302d1661a5SPawel Jakub Dawidek /* 25312d1661a5SPawel Jakub Dawidek * Mark disk as dirty on open and unmark on close. 25322d1661a5SPawel Jakub Dawidek */ 25332d1661a5SPawel Jakub Dawidek if (pp->acw == 0 && dcw > 0) { 25342d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 25352d1661a5SPawel Jakub Dawidek "Disk %s (device %s) marked as dirty.", 25362d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), sc->sc_name); 25372d1661a5SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_DIRTY; 25382d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(disk); 25392d1661a5SPawel Jakub Dawidek } else if (pp->acw > 0 && dcw == 0) { 25402d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 25412d1661a5SPawel Jakub Dawidek "Disk %s (device %s) marked as clean.", 25422d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), sc->sc_name); 25432d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 25442d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(disk); 25452d1661a5SPawel Jakub Dawidek } 25462d1661a5SPawel Jakub Dawidek error = 0; 25472d1661a5SPawel Jakub Dawidek } else { 25482d1661a5SPawel Jakub Dawidek sc->sc_bump_syncid = G_RAID3_BUMP_ON_FIRST_WRITE; 25492d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, 25502d1661a5SPawel Jakub Dawidek G_RAID3_DISK_STATE_DISCONNECTED, 25512d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 25522d1661a5SPawel Jakub Dawidek } 25532d1661a5SPawel Jakub Dawidek } 25542d1661a5SPawel Jakub Dawidek return (error); 25552d1661a5SPawel Jakub Dawidek } 25562d1661a5SPawel Jakub Dawidek 25572d1661a5SPawel Jakub Dawidek static struct g_geom * 25582d1661a5SPawel Jakub Dawidek g_raid3_create(struct g_class *mp, const struct g_raid3_metadata *md) 25592d1661a5SPawel Jakub Dawidek { 25602d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 25612d1661a5SPawel Jakub Dawidek struct g_geom *gp; 25622d1661a5SPawel Jakub Dawidek int error, timeout; 25632d1661a5SPawel Jakub Dawidek u_int n; 25642d1661a5SPawel Jakub Dawidek 25652d1661a5SPawel Jakub Dawidek g_topology_assert(); 25662d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Creating device %s (id=%u).", md->md_name, md->md_id); 25672d1661a5SPawel Jakub Dawidek 25682d1661a5SPawel Jakub Dawidek /* One disk is minimum. */ 25692d1661a5SPawel Jakub Dawidek if (md->md_all < 1) 25702d1661a5SPawel Jakub Dawidek return (NULL); 25712d1661a5SPawel Jakub Dawidek /* 25722d1661a5SPawel Jakub Dawidek * Action geom. 25732d1661a5SPawel Jakub Dawidek */ 25742d1661a5SPawel Jakub Dawidek gp = g_new_geomf(mp, "%s", md->md_name); 25752d1661a5SPawel Jakub Dawidek sc = malloc(sizeof(*sc), M_RAID3, M_WAITOK | M_ZERO); 25762d1661a5SPawel Jakub Dawidek sc->sc_disks = malloc(sizeof(struct g_raid3_disk) * md->md_all, M_RAID3, 25772d1661a5SPawel Jakub Dawidek M_WAITOK | M_ZERO); 25782d1661a5SPawel Jakub Dawidek gp->start = g_raid3_start; 25792d1661a5SPawel Jakub Dawidek gp->spoiled = g_raid3_spoiled; 25802d1661a5SPawel Jakub Dawidek gp->orphan = g_raid3_orphan; 25812d1661a5SPawel Jakub Dawidek gp->access = g_raid3_access; 25822d1661a5SPawel Jakub Dawidek gp->dumpconf = g_raid3_dumpconf; 25832d1661a5SPawel Jakub Dawidek 25842d1661a5SPawel Jakub Dawidek sc->sc_id = md->md_id; 25852d1661a5SPawel Jakub Dawidek sc->sc_mediasize = md->md_mediasize; 25862d1661a5SPawel Jakub Dawidek sc->sc_sectorsize = md->md_sectorsize; 25872d1661a5SPawel Jakub Dawidek sc->sc_ndisks = md->md_all; 2588f5a2f7feSPawel Jakub Dawidek sc->sc_round_robin = 0; 25892d1661a5SPawel Jakub Dawidek sc->sc_flags = md->md_mflags; 25902d1661a5SPawel Jakub Dawidek sc->sc_bump_syncid = 0; 25912d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) 25922d1661a5SPawel Jakub Dawidek sc->sc_disks[n].d_state = G_RAID3_DISK_STATE_NODISK; 25932d1661a5SPawel Jakub Dawidek bioq_init(&sc->sc_queue); 25942d1661a5SPawel Jakub Dawidek mtx_init(&sc->sc_queue_mtx, "graid3:queue", NULL, MTX_DEF); 25952d1661a5SPawel Jakub Dawidek TAILQ_INIT(&sc->sc_events); 25962d1661a5SPawel Jakub Dawidek mtx_init(&sc->sc_events_mtx, "graid3:events", NULL, MTX_DEF); 25972d1661a5SPawel Jakub Dawidek callout_init(&sc->sc_callout, CALLOUT_MPSAFE); 25982d1661a5SPawel Jakub Dawidek sc->sc_state = G_RAID3_DEVICE_STATE_STARTING; 25992d1661a5SPawel Jakub Dawidek gp->softc = sc; 26002d1661a5SPawel Jakub Dawidek sc->sc_geom = gp; 26012d1661a5SPawel Jakub Dawidek sc->sc_provider = NULL; 26022d1661a5SPawel Jakub Dawidek /* 26032d1661a5SPawel Jakub Dawidek * Synchronization geom. 26042d1661a5SPawel Jakub Dawidek */ 26052d1661a5SPawel Jakub Dawidek gp = g_new_geomf(mp, "%s.sync", md->md_name); 26062d1661a5SPawel Jakub Dawidek gp->softc = sc; 26072d1661a5SPawel Jakub Dawidek gp->orphan = g_raid3_orphan; 26082d1661a5SPawel Jakub Dawidek sc->sc_sync.ds_geom = gp; 26092d1661a5SPawel Jakub Dawidek sc->sc_zone_64k = uma_zcreate("gr3:64k", 65536, NULL, NULL, NULL, NULL, 26102d1661a5SPawel Jakub Dawidek UMA_ALIGN_PTR, 0); 26112d1661a5SPawel Jakub Dawidek uma_zone_set_max(sc->sc_zone_64k, g_raid3_n64k); 26122d1661a5SPawel Jakub Dawidek sc->sc_zone_16k = uma_zcreate("gr3:16k", 16384, NULL, NULL, NULL, NULL, 26132d1661a5SPawel Jakub Dawidek UMA_ALIGN_PTR, 0); 26142d1661a5SPawel Jakub Dawidek uma_zone_set_max(sc->sc_zone_64k, g_raid3_n16k); 26152d1661a5SPawel Jakub Dawidek sc->sc_zone_4k = uma_zcreate("gr3:4k", 4096, NULL, NULL, NULL, NULL, 26162d1661a5SPawel Jakub Dawidek UMA_ALIGN_PTR, 0); 26172d1661a5SPawel Jakub Dawidek uma_zone_set_max(sc->sc_zone_4k, g_raid3_n4k); 26182d1661a5SPawel Jakub Dawidek error = kthread_create(g_raid3_worker, sc, &sc->sc_worker, 0, 0, 26192d1661a5SPawel Jakub Dawidek "g_raid3 %s", md->md_name); 26202d1661a5SPawel Jakub Dawidek if (error != 0) { 26212d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Cannot create kernel thread for %s.", 26222d1661a5SPawel Jakub Dawidek sc->sc_name); 26232d1661a5SPawel Jakub Dawidek uma_zdestroy(sc->sc_zone_64k); 26242d1661a5SPawel Jakub Dawidek uma_zdestroy(sc->sc_zone_16k); 26252d1661a5SPawel Jakub Dawidek uma_zdestroy(sc->sc_zone_4k); 26262d1661a5SPawel Jakub Dawidek g_destroy_geom(sc->sc_sync.ds_geom); 26272d1661a5SPawel Jakub Dawidek mtx_destroy(&sc->sc_events_mtx); 26282d1661a5SPawel Jakub Dawidek mtx_destroy(&sc->sc_queue_mtx); 26292d1661a5SPawel Jakub Dawidek g_destroy_geom(sc->sc_geom); 26302d1661a5SPawel Jakub Dawidek free(sc->sc_disks, M_RAID3); 26312d1661a5SPawel Jakub Dawidek free(sc, M_RAID3); 26322d1661a5SPawel Jakub Dawidek return (NULL); 26332d1661a5SPawel Jakub Dawidek } 26342d1661a5SPawel Jakub Dawidek 26352d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s created (id=%u).", sc->sc_name, sc->sc_id); 26362d1661a5SPawel Jakub Dawidek 26372d1661a5SPawel Jakub Dawidek /* 26382d1661a5SPawel Jakub Dawidek * Run timeout. 26392d1661a5SPawel Jakub Dawidek */ 26402d1661a5SPawel Jakub Dawidek timeout = atomic_load_acq_int(&g_raid3_timeout); 26412d1661a5SPawel Jakub Dawidek callout_reset(&sc->sc_callout, timeout * hz, g_raid3_go, sc); 26422d1661a5SPawel Jakub Dawidek return (sc->sc_geom); 26432d1661a5SPawel Jakub Dawidek } 26442d1661a5SPawel Jakub Dawidek 26452d1661a5SPawel Jakub Dawidek int 26462d1661a5SPawel Jakub Dawidek g_raid3_destroy(struct g_raid3_softc *sc, boolean_t force) 26472d1661a5SPawel Jakub Dawidek { 26482d1661a5SPawel Jakub Dawidek struct g_provider *pp; 26492d1661a5SPawel Jakub Dawidek 26502d1661a5SPawel Jakub Dawidek g_topology_assert(); 26512d1661a5SPawel Jakub Dawidek 26522d1661a5SPawel Jakub Dawidek if (sc == NULL) 26532d1661a5SPawel Jakub Dawidek return (ENXIO); 26542d1661a5SPawel Jakub Dawidek pp = sc->sc_provider; 26552d1661a5SPawel Jakub Dawidek if (pp != NULL && (pp->acr != 0 || pp->acw != 0 || pp->ace != 0)) { 26562d1661a5SPawel Jakub Dawidek if (force) { 26572d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s is still open, so it " 26582d1661a5SPawel Jakub Dawidek "can't be definitely removed.", pp->name); 26592d1661a5SPawel Jakub Dawidek } else { 26602d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 26612d1661a5SPawel Jakub Dawidek "Device %s is still open (r%dw%de%d).", pp->name, 26622d1661a5SPawel Jakub Dawidek pp->acr, pp->acw, pp->ace); 26632d1661a5SPawel Jakub Dawidek return (EBUSY); 26642d1661a5SPawel Jakub Dawidek } 26652d1661a5SPawel Jakub Dawidek } 26662d1661a5SPawel Jakub Dawidek 26672d1661a5SPawel Jakub Dawidek sc->sc_flags |= G_RAID3_DEVICE_FLAG_DESTROY; 26682d1661a5SPawel Jakub Dawidek sc->sc_flags |= G_RAID3_DEVICE_FLAG_WAIT; 26692d1661a5SPawel Jakub Dawidek g_topology_unlock(); 26702d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, sc); 26712d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 26722d1661a5SPawel Jakub Dawidek wakeup(sc); 26732d1661a5SPawel Jakub Dawidek wakeup(&sc->sc_queue); 26742d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 26752d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Sleeping %p.", __func__, &sc->sc_worker); 26762d1661a5SPawel Jakub Dawidek while (sc->sc_worker != NULL) 26772d1661a5SPawel Jakub Dawidek tsleep(&sc->sc_worker, PRIBIO, "r3:destroy", hz / 5); 26782d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Woken up %p.", __func__, &sc->sc_worker); 26792d1661a5SPawel Jakub Dawidek g_topology_lock(); 26802d1661a5SPawel Jakub Dawidek g_raid3_destroy_device(sc); 26812d1661a5SPawel Jakub Dawidek free(sc->sc_disks, M_RAID3); 26822d1661a5SPawel Jakub Dawidek free(sc, M_RAID3); 26832d1661a5SPawel Jakub Dawidek return (0); 26842d1661a5SPawel Jakub Dawidek } 26852d1661a5SPawel Jakub Dawidek 26862d1661a5SPawel Jakub Dawidek static void 26872d1661a5SPawel Jakub Dawidek g_raid3_taste_orphan(struct g_consumer *cp) 26882d1661a5SPawel Jakub Dawidek { 26892d1661a5SPawel Jakub Dawidek 26902d1661a5SPawel Jakub Dawidek KASSERT(1 == 0, ("%s called while tasting %s.", __func__, 26912d1661a5SPawel Jakub Dawidek cp->provider->name)); 26922d1661a5SPawel Jakub Dawidek } 26932d1661a5SPawel Jakub Dawidek 26942d1661a5SPawel Jakub Dawidek static struct g_geom * 26952d1661a5SPawel Jakub Dawidek g_raid3_taste(struct g_class *mp, struct g_provider *pp, int flags __unused) 26962d1661a5SPawel Jakub Dawidek { 26972d1661a5SPawel Jakub Dawidek struct g_raid3_metadata md; 26982d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 26992d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 27002d1661a5SPawel Jakub Dawidek struct g_geom *gp; 27012d1661a5SPawel Jakub Dawidek int error; 27022d1661a5SPawel Jakub Dawidek 27032d1661a5SPawel Jakub Dawidek g_topology_assert(); 27042d1661a5SPawel Jakub Dawidek g_trace(G_T_TOPOLOGY, "%s(%s, %s)", __func__, mp->name, pp->name); 27052d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Tasting %s.", pp->name); 270629c78ab3SPawel Jakub Dawidek /* Skip providers with 0 sectorsize. */ 270729c78ab3SPawel Jakub Dawidek if (pp->sectorsize == 0) 270829c78ab3SPawel Jakub Dawidek return (NULL); 27092d1661a5SPawel Jakub Dawidek 27102d1661a5SPawel Jakub Dawidek gp = g_new_geomf(mp, "raid3:taste"); 27112d1661a5SPawel Jakub Dawidek /* This orphan function should be never called. */ 27122d1661a5SPawel Jakub Dawidek gp->orphan = g_raid3_taste_orphan; 27132d1661a5SPawel Jakub Dawidek cp = g_new_consumer(gp); 27142d1661a5SPawel Jakub Dawidek g_attach(cp, pp); 27152d1661a5SPawel Jakub Dawidek error = g_raid3_read_metadata(cp, &md); 27162d1661a5SPawel Jakub Dawidek g_detach(cp); 27172d1661a5SPawel Jakub Dawidek g_destroy_consumer(cp); 27182d1661a5SPawel Jakub Dawidek g_destroy_geom(gp); 27192d1661a5SPawel Jakub Dawidek if (error != 0) 27202d1661a5SPawel Jakub Dawidek return (NULL); 27212d1661a5SPawel Jakub Dawidek gp = NULL; 27222d1661a5SPawel Jakub Dawidek 27232d1661a5SPawel Jakub Dawidek if (md.md_version > G_RAID3_VERSION) { 27242d1661a5SPawel Jakub Dawidek printf("geom_raid3.ko module is too old to handle %s.\n", 27252d1661a5SPawel Jakub Dawidek pp->name); 27262d1661a5SPawel Jakub Dawidek return (NULL); 27272d1661a5SPawel Jakub Dawidek } 27282d1661a5SPawel Jakub Dawidek if (md.md_provider[0] != '\0' && strcmp(md.md_provider, pp->name) != 0) 27292d1661a5SPawel Jakub Dawidek return (NULL); 27302d1661a5SPawel Jakub Dawidek if (g_raid3_debug >= 2) 27312d1661a5SPawel Jakub Dawidek raid3_metadata_dump(&md); 27322d1661a5SPawel Jakub Dawidek 27332d1661a5SPawel Jakub Dawidek /* 27342d1661a5SPawel Jakub Dawidek * Let's check if device already exists. 27352d1661a5SPawel Jakub Dawidek */ 27362d1661a5SPawel Jakub Dawidek LIST_FOREACH(gp, &mp->geom, geom) { 27372d1661a5SPawel Jakub Dawidek sc = gp->softc; 27382d1661a5SPawel Jakub Dawidek if (sc == NULL) 27392d1661a5SPawel Jakub Dawidek continue; 27402d1661a5SPawel Jakub Dawidek if (sc->sc_sync.ds_geom == gp) 27412d1661a5SPawel Jakub Dawidek continue; 27422d1661a5SPawel Jakub Dawidek if (strcmp(md.md_name, sc->sc_name) != 0) 27432d1661a5SPawel Jakub Dawidek continue; 27442d1661a5SPawel Jakub Dawidek if (md.md_id != sc->sc_id) { 27452d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s already configured.", 27462d1661a5SPawel Jakub Dawidek sc->sc_name); 27472d1661a5SPawel Jakub Dawidek return (NULL); 27482d1661a5SPawel Jakub Dawidek } 27492d1661a5SPawel Jakub Dawidek break; 27502d1661a5SPawel Jakub Dawidek } 27512d1661a5SPawel Jakub Dawidek if (gp == NULL) { 27522d1661a5SPawel Jakub Dawidek gp = g_raid3_create(mp, &md); 27532d1661a5SPawel Jakub Dawidek if (gp == NULL) { 27542d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Cannot create device %s.", 27552d1661a5SPawel Jakub Dawidek md.md_name); 27562d1661a5SPawel Jakub Dawidek return (NULL); 27572d1661a5SPawel Jakub Dawidek } 27582d1661a5SPawel Jakub Dawidek sc = gp->softc; 27592d1661a5SPawel Jakub Dawidek } 27602d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Adding disk %s to %s.", pp->name, gp->name); 27612d1661a5SPawel Jakub Dawidek error = g_raid3_add_disk(sc, pp, &md); 27622d1661a5SPawel Jakub Dawidek if (error != 0) { 27632d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Cannot add disk %s to %s (error=%d).", 27642d1661a5SPawel Jakub Dawidek pp->name, gp->name, error); 27652d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_NODISK) == 27662d1661a5SPawel Jakub Dawidek sc->sc_ndisks) { 27672d1661a5SPawel Jakub Dawidek g_raid3_destroy(sc, 1); 27682d1661a5SPawel Jakub Dawidek } 27692d1661a5SPawel Jakub Dawidek return (NULL); 27702d1661a5SPawel Jakub Dawidek } 27712d1661a5SPawel Jakub Dawidek return (gp); 27722d1661a5SPawel Jakub Dawidek } 27732d1661a5SPawel Jakub Dawidek 27742d1661a5SPawel Jakub Dawidek static int 27752d1661a5SPawel Jakub Dawidek g_raid3_destroy_geom(struct gctl_req *req __unused, struct g_class *mp __unused, 27762d1661a5SPawel Jakub Dawidek struct g_geom *gp) 27772d1661a5SPawel Jakub Dawidek { 27782d1661a5SPawel Jakub Dawidek 27792d1661a5SPawel Jakub Dawidek return (g_raid3_destroy(gp->softc, 0)); 27802d1661a5SPawel Jakub Dawidek } 27812d1661a5SPawel Jakub Dawidek 27822d1661a5SPawel Jakub Dawidek static void 27832d1661a5SPawel Jakub Dawidek g_raid3_dumpconf(struct sbuf *sb, const char *indent, struct g_geom *gp, 27842d1661a5SPawel Jakub Dawidek struct g_consumer *cp, struct g_provider *pp) 27852d1661a5SPawel Jakub Dawidek { 27862d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 27872d1661a5SPawel Jakub Dawidek 27882d1661a5SPawel Jakub Dawidek g_topology_assert(); 27892d1661a5SPawel Jakub Dawidek 27902d1661a5SPawel Jakub Dawidek sc = gp->softc; 27912d1661a5SPawel Jakub Dawidek if (sc == NULL) 27922d1661a5SPawel Jakub Dawidek return; 27932d1661a5SPawel Jakub Dawidek /* Skip synchronization geom. */ 27942d1661a5SPawel Jakub Dawidek if (gp == sc->sc_sync.ds_geom) 27952d1661a5SPawel Jakub Dawidek return; 27962d1661a5SPawel Jakub Dawidek if (pp != NULL) { 27972d1661a5SPawel Jakub Dawidek /* Nothing here. */ 27982d1661a5SPawel Jakub Dawidek } else if (cp != NULL) { 27992d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 28002d1661a5SPawel Jakub Dawidek 28012d1661a5SPawel Jakub Dawidek disk = cp->private; 28022d1661a5SPawel Jakub Dawidek if (disk == NULL) 28032d1661a5SPawel Jakub Dawidek return; 28042d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Type>", indent); 28052d1661a5SPawel Jakub Dawidek if (disk->d_no == sc->sc_ndisks - 1) 28062d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "PARITY"); 28072d1661a5SPawel Jakub Dawidek else 28082d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "DATA"); 28092d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "</Type>\n"); 28102d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Number>%u</Number>\n", indent, 28112d1661a5SPawel Jakub Dawidek (u_int)disk->d_no); 28122d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING) { 28132d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Synchronized>", indent); 28142d1661a5SPawel Jakub Dawidek if (disk->d_sync.ds_offset_done == 0) 28152d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "0%%"); 28162d1661a5SPawel Jakub Dawidek else { 28172d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%u%%", 28182d1661a5SPawel Jakub Dawidek (u_int)((disk->d_sync.ds_offset_done * 100) / 2819c0d68b6eSPawel Jakub Dawidek (sc->sc_mediasize / (sc->sc_ndisks - 1)))); 28202d1661a5SPawel Jakub Dawidek } 28212d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "</Synchronized>\n"); 28222d1661a5SPawel Jakub Dawidek } 28232d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<SyncID>%u</SyncID>\n", indent, 28242d1661a5SPawel Jakub Dawidek disk->d_sync.ds_syncid); 28252d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Flags>", indent); 28262d1661a5SPawel Jakub Dawidek if (disk->d_flags == 0) 28272d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "NONE"); 28282d1661a5SPawel Jakub Dawidek else { 28292d1661a5SPawel Jakub Dawidek int first = 1; 28302d1661a5SPawel Jakub Dawidek 28312d1661a5SPawel Jakub Dawidek #define ADD_FLAG(flag, name) do { \ 28322d1661a5SPawel Jakub Dawidek if ((disk->d_flags & (flag)) != 0) { \ 28332d1661a5SPawel Jakub Dawidek if (!first) \ 28342d1661a5SPawel Jakub Dawidek sbuf_printf(sb, ", "); \ 28352d1661a5SPawel Jakub Dawidek else \ 28362d1661a5SPawel Jakub Dawidek first = 0; \ 28372d1661a5SPawel Jakub Dawidek sbuf_printf(sb, name); \ 28382d1661a5SPawel Jakub Dawidek } \ 28392d1661a5SPawel Jakub Dawidek } while (0) 28402d1661a5SPawel Jakub Dawidek ADD_FLAG(G_RAID3_DISK_FLAG_DIRTY, "DIRTY"); 28412d1661a5SPawel Jakub Dawidek ADD_FLAG(G_RAID3_DISK_FLAG_HARDCODED, "HARDCODED"); 28422d1661a5SPawel Jakub Dawidek ADD_FLAG(G_RAID3_DISK_FLAG_SYNCHRONIZING, 28432d1661a5SPawel Jakub Dawidek "SYNCHRONIZING"); 28442d1661a5SPawel Jakub Dawidek ADD_FLAG(G_RAID3_DISK_FLAG_FORCE_SYNC, "FORCE_SYNC"); 28452d1661a5SPawel Jakub Dawidek #undef ADD_FLAG 28462d1661a5SPawel Jakub Dawidek } 28472d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "</Flags>\n"); 28482d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<State>%s</State>\n", indent, 28492d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state)); 28502d1661a5SPawel Jakub Dawidek } else { 28512d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<ID>%u</ID>\n", indent, (u_int)sc->sc_id); 28522d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<SyncID>%u</SyncID>\n", indent, sc->sc_syncid); 28532d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Flags>", indent); 28542d1661a5SPawel Jakub Dawidek if (sc->sc_flags == 0) 28552d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "NONE"); 28562d1661a5SPawel Jakub Dawidek else { 28572d1661a5SPawel Jakub Dawidek int first = 1; 28582d1661a5SPawel Jakub Dawidek 28592d1661a5SPawel Jakub Dawidek #define ADD_FLAG(flag, name) do { \ 28602d1661a5SPawel Jakub Dawidek if ((sc->sc_flags & (flag)) != 0) { \ 28612d1661a5SPawel Jakub Dawidek if (!first) \ 28622d1661a5SPawel Jakub Dawidek sbuf_printf(sb, ", "); \ 28632d1661a5SPawel Jakub Dawidek else \ 28642d1661a5SPawel Jakub Dawidek first = 0; \ 28652d1661a5SPawel Jakub Dawidek sbuf_printf(sb, name); \ 28662d1661a5SPawel Jakub Dawidek } \ 28672d1661a5SPawel Jakub Dawidek } while (0) 28682d1661a5SPawel Jakub Dawidek ADD_FLAG(G_RAID3_DEVICE_FLAG_NOAUTOSYNC, "NOAUTOSYNC"); 2869f5a2f7feSPawel Jakub Dawidek ADD_FLAG(G_RAID3_DEVICE_FLAG_ROUND_ROBIN, 2870f5a2f7feSPawel Jakub Dawidek "ROUND-ROBIN"); 2871dba915cfSPawel Jakub Dawidek ADD_FLAG(G_RAID3_DEVICE_FLAG_VERIFY, "VERIFY"); 28722d1661a5SPawel Jakub Dawidek #undef ADD_FLAG 28732d1661a5SPawel Jakub Dawidek } 28742d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "</Flags>\n"); 28752d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Components>%u</Components>\n", indent, 28762d1661a5SPawel Jakub Dawidek sc->sc_ndisks); 287728b31df7SPawel Jakub Dawidek sbuf_printf(sb, "%s<State>%s</State>\n", indent, 287828b31df7SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state)); 28792d1661a5SPawel Jakub Dawidek } 28802d1661a5SPawel Jakub Dawidek } 28812d1661a5SPawel Jakub Dawidek 28822d1661a5SPawel Jakub Dawidek DECLARE_GEOM_CLASS(g_raid3_class, g_raid3); 2883