12d1661a5SPawel Jakub Dawidek /*- 2e6757059SPawel Jakub Dawidek * Copyright (c) 2004-2006 Pawel Jakub Dawidek <pjd@FreeBSD.org> 32d1661a5SPawel Jakub Dawidek * All rights reserved. 42d1661a5SPawel Jakub Dawidek * 52d1661a5SPawel Jakub Dawidek * Redistribution and use in source and binary forms, with or without 62d1661a5SPawel Jakub Dawidek * modification, are permitted provided that the following conditions 72d1661a5SPawel Jakub Dawidek * are met: 82d1661a5SPawel Jakub Dawidek * 1. Redistributions of source code must retain the above copyright 92d1661a5SPawel Jakub Dawidek * notice, this list of conditions and the following disclaimer. 102d1661a5SPawel Jakub Dawidek * 2. Redistributions in binary form must reproduce the above copyright 112d1661a5SPawel Jakub Dawidek * notice, this list of conditions and the following disclaimer in the 122d1661a5SPawel Jakub Dawidek * documentation and/or other materials provided with the distribution. 132d1661a5SPawel Jakub Dawidek * 142d1661a5SPawel Jakub Dawidek * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND 152d1661a5SPawel Jakub Dawidek * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 162d1661a5SPawel Jakub Dawidek * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 172d1661a5SPawel Jakub Dawidek * ARE DISCLAIMED. 
IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE 182d1661a5SPawel Jakub Dawidek * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 192d1661a5SPawel Jakub Dawidek * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 202d1661a5SPawel Jakub Dawidek * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 212d1661a5SPawel Jakub Dawidek * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 222d1661a5SPawel Jakub Dawidek * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 232d1661a5SPawel Jakub Dawidek * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 242d1661a5SPawel Jakub Dawidek * SUCH DAMAGE. 252d1661a5SPawel Jakub Dawidek */ 262d1661a5SPawel Jakub Dawidek 272d1661a5SPawel Jakub Dawidek #include <sys/cdefs.h> 282d1661a5SPawel Jakub Dawidek __FBSDID("$FreeBSD$"); 292d1661a5SPawel Jakub Dawidek 302d1661a5SPawel Jakub Dawidek #include <sys/param.h> 312d1661a5SPawel Jakub Dawidek #include <sys/systm.h> 322d1661a5SPawel Jakub Dawidek #include <sys/kernel.h> 332d1661a5SPawel Jakub Dawidek #include <sys/module.h> 342d1661a5SPawel Jakub Dawidek #include <sys/limits.h> 352d1661a5SPawel Jakub Dawidek #include <sys/lock.h> 362d1661a5SPawel Jakub Dawidek #include <sys/mutex.h> 372d1661a5SPawel Jakub Dawidek #include <sys/bio.h> 385d807a0eSAndrey V. 
Elsukov #include <sys/sbuf.h> 392d1661a5SPawel Jakub Dawidek #include <sys/sysctl.h> 402d1661a5SPawel Jakub Dawidek #include <sys/malloc.h> 419da3072cSPawel Jakub Dawidek #include <sys/eventhandler.h> 422d1661a5SPawel Jakub Dawidek #include <vm/uma.h> 432d1661a5SPawel Jakub Dawidek #include <geom/geom.h> 442d1661a5SPawel Jakub Dawidek #include <sys/proc.h> 452d1661a5SPawel Jakub Dawidek #include <sys/kthread.h> 4663710c4dSJohn Baldwin #include <sys/sched.h> 472d1661a5SPawel Jakub Dawidek #include <geom/raid3/g_raid3.h> 482d1661a5SPawel Jakub Dawidek 49cb08c2ccSAlexander Leidinger FEATURE(geom_raid3, "GEOM RAID-3 functionality"); 502d1661a5SPawel Jakub Dawidek 515bb84bc8SRobert Watson static MALLOC_DEFINE(M_RAID3, "raid3_data", "GEOM_RAID3 Data"); 522d1661a5SPawel Jakub Dawidek 532d1661a5SPawel Jakub Dawidek SYSCTL_DECL(_kern_geom); 546472ac3dSEd Schouten static SYSCTL_NODE(_kern_geom, OID_AUTO, raid3, CTLFLAG_RW, 0, 556472ac3dSEd Schouten "GEOM_RAID3 stuff"); 56809a9dc6SPawel Jakub Dawidek u_int g_raid3_debug = 0; 576d7b8aecSPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.debug", &g_raid3_debug); 582d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, debug, CTLFLAG_RW, &g_raid3_debug, 0, 592d1661a5SPawel Jakub Dawidek "Debug level"); 60e5e7825cSPawel Jakub Dawidek static u_int g_raid3_timeout = 4; 614d006a98SPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.timeout", &g_raid3_timeout); 622d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, timeout, CTLFLAG_RW, &g_raid3_timeout, 632d1661a5SPawel Jakub Dawidek 0, "Time to wait on all raid3 components"); 644d006a98SPawel Jakub Dawidek static u_int g_raid3_idletime = 5; 654d006a98SPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.idletime", &g_raid3_idletime); 664d006a98SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, idletime, CTLFLAG_RW, 674d006a98SPawel Jakub Dawidek &g_raid3_idletime, 0, "Mark components as clean when idling"); 683aae74ecSPawel Jakub Dawidek static u_int 
g_raid3_disconnect_on_failure = 1; 6967cae8aaSPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.disconnect_on_failure", 7067cae8aaSPawel Jakub Dawidek &g_raid3_disconnect_on_failure); 713aae74ecSPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, disconnect_on_failure, CTLFLAG_RW, 723aae74ecSPawel Jakub Dawidek &g_raid3_disconnect_on_failure, 0, "Disconnect component on I/O failure."); 73e6757059SPawel Jakub Dawidek static u_int g_raid3_syncreqs = 2; 743650be51SPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.sync_requests", &g_raid3_syncreqs); 753650be51SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, sync_requests, CTLFLAG_RDTUN, 763650be51SPawel Jakub Dawidek &g_raid3_syncreqs, 0, "Parallel synchronization I/O requests."); 77ed940a82SPawel Jakub Dawidek static u_int g_raid3_use_malloc = 0; 78ed940a82SPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.use_malloc", &g_raid3_use_malloc); 79ed940a82SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, use_malloc, CTLFLAG_RDTUN, 80ed940a82SPawel Jakub Dawidek &g_raid3_use_malloc, 0, "Use malloc(9) instead of uma(9)."); 812d1661a5SPawel Jakub Dawidek 822d1661a5SPawel Jakub Dawidek static u_int g_raid3_n64k = 50; 832d1661a5SPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.n64k", &g_raid3_n64k); 842d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, n64k, CTLFLAG_RD, &g_raid3_n64k, 0, 852d1661a5SPawel Jakub Dawidek "Maximum number of 64kB allocations"); 862d1661a5SPawel Jakub Dawidek static u_int g_raid3_n16k = 200; 872d1661a5SPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.n16k", &g_raid3_n16k); 882d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, OID_AUTO, n16k, CTLFLAG_RD, &g_raid3_n16k, 0, 892d1661a5SPawel Jakub Dawidek "Maximum number of 16kB allocations"); 902d1661a5SPawel Jakub Dawidek static u_int g_raid3_n4k = 1200; 912d1661a5SPawel Jakub Dawidek TUNABLE_INT("kern.geom.raid3.n4k", &g_raid3_n4k); 922d1661a5SPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3, 
OID_AUTO, n4k, CTLFLAG_RD, &g_raid3_n4k, 0, 932d1661a5SPawel Jakub Dawidek "Maximum number of 4kB allocations"); 942d1661a5SPawel Jakub Dawidek 956472ac3dSEd Schouten static SYSCTL_NODE(_kern_geom_raid3, OID_AUTO, stat, CTLFLAG_RW, 0, 962d1661a5SPawel Jakub Dawidek "GEOM_RAID3 statistics"); 97dba915cfSPawel Jakub Dawidek static u_int g_raid3_parity_mismatch = 0; 98dba915cfSPawel Jakub Dawidek SYSCTL_UINT(_kern_geom_raid3_stat, OID_AUTO, parity_mismatch, CTLFLAG_RD, 99dba915cfSPawel Jakub Dawidek &g_raid3_parity_mismatch, 0, "Number of failures in VERIFY mode"); 1002d1661a5SPawel Jakub Dawidek 1012d1661a5SPawel Jakub Dawidek #define MSLEEP(ident, mtx, priority, wmesg, timeout) do { \ 1022d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Sleeping %p.", __func__, (ident)); \ 1032d1661a5SPawel Jakub Dawidek msleep((ident), (mtx), (priority), (wmesg), (timeout)); \ 1042d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Woken up %p.", __func__, (ident)); \ 1052d1661a5SPawel Jakub Dawidek } while (0) 1062d1661a5SPawel Jakub Dawidek 107f62c1a47SAlexander Motin static eventhandler_tag g_raid3_post_sync = NULL; 108f62c1a47SAlexander Motin static int g_raid3_shutdown = 0; 1092d1661a5SPawel Jakub Dawidek 1102d1661a5SPawel Jakub Dawidek static int g_raid3_destroy_geom(struct gctl_req *req, struct g_class *mp, 1112d1661a5SPawel Jakub Dawidek struct g_geom *gp); 1122d1661a5SPawel Jakub Dawidek static g_taste_t g_raid3_taste; 1139da3072cSPawel Jakub Dawidek static void g_raid3_init(struct g_class *mp); 1149da3072cSPawel Jakub Dawidek static void g_raid3_fini(struct g_class *mp); 1152d1661a5SPawel Jakub Dawidek 1162d1661a5SPawel Jakub Dawidek struct g_class g_raid3_class = { 1172d1661a5SPawel Jakub Dawidek .name = G_RAID3_CLASS_NAME, 1182d1661a5SPawel Jakub Dawidek .version = G_VERSION, 1192d1661a5SPawel Jakub Dawidek .ctlreq = g_raid3_config, 1202d1661a5SPawel Jakub Dawidek .taste = g_raid3_taste, 1219da3072cSPawel Jakub Dawidek .destroy_geom = g_raid3_destroy_geom, 
1229da3072cSPawel Jakub Dawidek .init = g_raid3_init, 1239da3072cSPawel Jakub Dawidek .fini = g_raid3_fini 1242d1661a5SPawel Jakub Dawidek }; 1252d1661a5SPawel Jakub Dawidek 1262d1661a5SPawel Jakub Dawidek 1272d1661a5SPawel Jakub Dawidek static void g_raid3_destroy_provider(struct g_raid3_softc *sc); 128d97d5ee9SPawel Jakub Dawidek static int g_raid3_update_disk(struct g_raid3_disk *disk, u_int state); 129d97d5ee9SPawel Jakub Dawidek static void g_raid3_update_device(struct g_raid3_softc *sc, boolean_t force); 1302d1661a5SPawel Jakub Dawidek static void g_raid3_dumpconf(struct sbuf *sb, const char *indent, 1312d1661a5SPawel Jakub Dawidek struct g_geom *gp, struct g_consumer *cp, struct g_provider *pp); 1322d1661a5SPawel Jakub Dawidek static void g_raid3_sync_stop(struct g_raid3_softc *sc, int type); 1333650be51SPawel Jakub Dawidek static int g_raid3_register_request(struct bio *pbp); 1343650be51SPawel Jakub Dawidek static void g_raid3_sync_release(struct g_raid3_softc *sc); 1352d1661a5SPawel Jakub Dawidek 1362d1661a5SPawel Jakub Dawidek 1372d1661a5SPawel Jakub Dawidek static const char * 1382d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(int state) 1392d1661a5SPawel Jakub Dawidek { 1402d1661a5SPawel Jakub Dawidek 1412d1661a5SPawel Jakub Dawidek switch (state) { 1422d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_NODISK: 1432d1661a5SPawel Jakub Dawidek return ("NODISK"); 1442d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_NONE: 1452d1661a5SPawel Jakub Dawidek return ("NONE"); 1462d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_NEW: 1472d1661a5SPawel Jakub Dawidek return ("NEW"); 1482d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_ACTIVE: 1492d1661a5SPawel Jakub Dawidek return ("ACTIVE"); 1502d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_STALE: 1512d1661a5SPawel Jakub Dawidek return ("STALE"); 1522d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_SYNCHRONIZING: 1532d1661a5SPawel Jakub Dawidek return ("SYNCHRONIZING"); 1542d1661a5SPawel 
Jakub Dawidek case G_RAID3_DISK_STATE_DISCONNECTED: 1552d1661a5SPawel Jakub Dawidek return ("DISCONNECTED"); 1562d1661a5SPawel Jakub Dawidek default: 1572d1661a5SPawel Jakub Dawidek return ("INVALID"); 1582d1661a5SPawel Jakub Dawidek } 1592d1661a5SPawel Jakub Dawidek } 1602d1661a5SPawel Jakub Dawidek 1612d1661a5SPawel Jakub Dawidek static const char * 1622d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(int state) 1632d1661a5SPawel Jakub Dawidek { 1642d1661a5SPawel Jakub Dawidek 1652d1661a5SPawel Jakub Dawidek switch (state) { 1662d1661a5SPawel Jakub Dawidek case G_RAID3_DEVICE_STATE_STARTING: 1672d1661a5SPawel Jakub Dawidek return ("STARTING"); 1682d1661a5SPawel Jakub Dawidek case G_RAID3_DEVICE_STATE_DEGRADED: 1692d1661a5SPawel Jakub Dawidek return ("DEGRADED"); 1702d1661a5SPawel Jakub Dawidek case G_RAID3_DEVICE_STATE_COMPLETE: 1712d1661a5SPawel Jakub Dawidek return ("COMPLETE"); 1722d1661a5SPawel Jakub Dawidek default: 1732d1661a5SPawel Jakub Dawidek return ("INVALID"); 1742d1661a5SPawel Jakub Dawidek } 1752d1661a5SPawel Jakub Dawidek } 1762d1661a5SPawel Jakub Dawidek 1772d1661a5SPawel Jakub Dawidek const char * 1782d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(struct g_raid3_disk *disk) 1792d1661a5SPawel Jakub Dawidek { 1802d1661a5SPawel Jakub Dawidek 1812d1661a5SPawel Jakub Dawidek if (disk->d_consumer == NULL || disk->d_consumer->provider == NULL) 1822d1661a5SPawel Jakub Dawidek return ("[unknown]"); 1832d1661a5SPawel Jakub Dawidek return (disk->d_name); 1842d1661a5SPawel Jakub Dawidek } 1852d1661a5SPawel Jakub Dawidek 186ed940a82SPawel Jakub Dawidek static void * 187ed940a82SPawel Jakub Dawidek g_raid3_alloc(struct g_raid3_softc *sc, size_t size, int flags) 188ed940a82SPawel Jakub Dawidek { 189ed940a82SPawel Jakub Dawidek void *ptr; 190d4060fa6SAlexander Motin enum g_raid3_zones zone; 191ed940a82SPawel Jakub Dawidek 192d4060fa6SAlexander Motin if (g_raid3_use_malloc || 193d4060fa6SAlexander Motin (zone = g_raid3_zone(size)) == G_RAID3_NUM_ZONES) 
194ed940a82SPawel Jakub Dawidek ptr = malloc(size, M_RAID3, flags); 195ed940a82SPawel Jakub Dawidek else { 196d4060fa6SAlexander Motin ptr = uma_zalloc_arg(sc->sc_zones[zone].sz_zone, 197d4060fa6SAlexander Motin &sc->sc_zones[zone], flags); 198d4060fa6SAlexander Motin sc->sc_zones[zone].sz_requested++; 199ed940a82SPawel Jakub Dawidek if (ptr == NULL) 200d4060fa6SAlexander Motin sc->sc_zones[zone].sz_failed++; 201ed940a82SPawel Jakub Dawidek } 202ed940a82SPawel Jakub Dawidek return (ptr); 203ed940a82SPawel Jakub Dawidek } 204ed940a82SPawel Jakub Dawidek 205ed940a82SPawel Jakub Dawidek static void 206ed940a82SPawel Jakub Dawidek g_raid3_free(struct g_raid3_softc *sc, void *ptr, size_t size) 207ed940a82SPawel Jakub Dawidek { 208d4060fa6SAlexander Motin enum g_raid3_zones zone; 209ed940a82SPawel Jakub Dawidek 210d4060fa6SAlexander Motin if (g_raid3_use_malloc || 211d4060fa6SAlexander Motin (zone = g_raid3_zone(size)) == G_RAID3_NUM_ZONES) 212ed940a82SPawel Jakub Dawidek free(ptr, M_RAID3); 213ed940a82SPawel Jakub Dawidek else { 214d4060fa6SAlexander Motin uma_zfree_arg(sc->sc_zones[zone].sz_zone, 215d4060fa6SAlexander Motin ptr, &sc->sc_zones[zone]); 216ed940a82SPawel Jakub Dawidek } 217ed940a82SPawel Jakub Dawidek } 218ed940a82SPawel Jakub Dawidek 2193650be51SPawel Jakub Dawidek static int 2203650be51SPawel Jakub Dawidek g_raid3_uma_ctor(void *mem, int size, void *arg, int flags) 2213650be51SPawel Jakub Dawidek { 2223650be51SPawel Jakub Dawidek struct g_raid3_zone *sz = arg; 2233650be51SPawel Jakub Dawidek 2240d14fae5SPawel Jakub Dawidek if (sz->sz_max > 0 && sz->sz_inuse == sz->sz_max) 2253650be51SPawel Jakub Dawidek return (ENOMEM); 2263650be51SPawel Jakub Dawidek sz->sz_inuse++; 2273650be51SPawel Jakub Dawidek return (0); 2283650be51SPawel Jakub Dawidek } 2293650be51SPawel Jakub Dawidek 2303650be51SPawel Jakub Dawidek static void 2313650be51SPawel Jakub Dawidek g_raid3_uma_dtor(void *mem, int size, void *arg) 2323650be51SPawel Jakub Dawidek { 2333650be51SPawel 
Jakub Dawidek struct g_raid3_zone *sz = arg; 2343650be51SPawel Jakub Dawidek 2353650be51SPawel Jakub Dawidek sz->sz_inuse--; 2363650be51SPawel Jakub Dawidek } 2373650be51SPawel Jakub Dawidek 23806b215fdSAlexander Motin #define g_raid3_xor(src, dst, size) \ 23906b215fdSAlexander Motin _g_raid3_xor((uint64_t *)(src), \ 2402d1661a5SPawel Jakub Dawidek (uint64_t *)(dst), (size_t)size) 2412d1661a5SPawel Jakub Dawidek static void 24206b215fdSAlexander Motin _g_raid3_xor(uint64_t *src, uint64_t *dst, size_t size) 2432d1661a5SPawel Jakub Dawidek { 2442d1661a5SPawel Jakub Dawidek 2452d1661a5SPawel Jakub Dawidek KASSERT((size % 128) == 0, ("Invalid size: %zu.", size)); 2462d1661a5SPawel Jakub Dawidek for (; size > 0; size -= 128) { 24706b215fdSAlexander Motin *dst++ ^= (*src++); 24806b215fdSAlexander Motin *dst++ ^= (*src++); 24906b215fdSAlexander Motin *dst++ ^= (*src++); 25006b215fdSAlexander Motin *dst++ ^= (*src++); 25106b215fdSAlexander Motin *dst++ ^= (*src++); 25206b215fdSAlexander Motin *dst++ ^= (*src++); 25306b215fdSAlexander Motin *dst++ ^= (*src++); 25406b215fdSAlexander Motin *dst++ ^= (*src++); 25506b215fdSAlexander Motin *dst++ ^= (*src++); 25606b215fdSAlexander Motin *dst++ ^= (*src++); 25706b215fdSAlexander Motin *dst++ ^= (*src++); 25806b215fdSAlexander Motin *dst++ ^= (*src++); 25906b215fdSAlexander Motin *dst++ ^= (*src++); 26006b215fdSAlexander Motin *dst++ ^= (*src++); 26106b215fdSAlexander Motin *dst++ ^= (*src++); 26206b215fdSAlexander Motin *dst++ ^= (*src++); 2632d1661a5SPawel Jakub Dawidek } 2642d1661a5SPawel Jakub Dawidek } 2652d1661a5SPawel Jakub Dawidek 266dba915cfSPawel Jakub Dawidek static int 267dba915cfSPawel Jakub Dawidek g_raid3_is_zero(struct bio *bp) 268dba915cfSPawel Jakub Dawidek { 269dba915cfSPawel Jakub Dawidek static const uint64_t zeros[] = { 270dba915cfSPawel Jakub Dawidek 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 271dba915cfSPawel Jakub Dawidek }; 272dba915cfSPawel Jakub Dawidek u_char *addr; 273dba915cfSPawel Jakub Dawidek 
ssize_t size; 274dba915cfSPawel Jakub Dawidek 275dba915cfSPawel Jakub Dawidek size = bp->bio_length; 276dba915cfSPawel Jakub Dawidek addr = (u_char *)bp->bio_data; 277dba915cfSPawel Jakub Dawidek for (; size > 0; size -= sizeof(zeros), addr += sizeof(zeros)) { 278dba915cfSPawel Jakub Dawidek if (bcmp(addr, zeros, sizeof(zeros)) != 0) 279dba915cfSPawel Jakub Dawidek return (0); 280dba915cfSPawel Jakub Dawidek } 281dba915cfSPawel Jakub Dawidek return (1); 282dba915cfSPawel Jakub Dawidek } 283dba915cfSPawel Jakub Dawidek 2842d1661a5SPawel Jakub Dawidek /* 2852d1661a5SPawel Jakub Dawidek * --- Events handling functions --- 2862d1661a5SPawel Jakub Dawidek * Events in geom_raid3 are used to maintain disks and device status 2872d1661a5SPawel Jakub Dawidek * from one thread to simplify locking. 2882d1661a5SPawel Jakub Dawidek */ 2892d1661a5SPawel Jakub Dawidek static void 2902d1661a5SPawel Jakub Dawidek g_raid3_event_free(struct g_raid3_event *ep) 2912d1661a5SPawel Jakub Dawidek { 2922d1661a5SPawel Jakub Dawidek 2932d1661a5SPawel Jakub Dawidek free(ep, M_RAID3); 2942d1661a5SPawel Jakub Dawidek } 2952d1661a5SPawel Jakub Dawidek 2962d1661a5SPawel Jakub Dawidek int 2972d1661a5SPawel Jakub Dawidek g_raid3_event_send(void *arg, int state, int flags) 2982d1661a5SPawel Jakub Dawidek { 2992d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 3002d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 3012d1661a5SPawel Jakub Dawidek struct g_raid3_event *ep; 3022d1661a5SPawel Jakub Dawidek int error; 3032d1661a5SPawel Jakub Dawidek 3042d1661a5SPawel Jakub Dawidek ep = malloc(sizeof(*ep), M_RAID3, M_WAITOK); 3052d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Sending event %p.", __func__, ep); 3062d1661a5SPawel Jakub Dawidek if ((flags & G_RAID3_EVENT_DEVICE) != 0) { 3072d1661a5SPawel Jakub Dawidek disk = NULL; 3082d1661a5SPawel Jakub Dawidek sc = arg; 3092d1661a5SPawel Jakub Dawidek } else { 3102d1661a5SPawel Jakub Dawidek disk = arg; 3112d1661a5SPawel Jakub Dawidek sc = 
disk->d_softc; 3122d1661a5SPawel Jakub Dawidek } 3132d1661a5SPawel Jakub Dawidek ep->e_disk = disk; 3142d1661a5SPawel Jakub Dawidek ep->e_state = state; 3152d1661a5SPawel Jakub Dawidek ep->e_flags = flags; 3162d1661a5SPawel Jakub Dawidek ep->e_error = 0; 3172d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 3182d1661a5SPawel Jakub Dawidek TAILQ_INSERT_TAIL(&sc->sc_events, ep, e_next); 3192d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_events_mtx); 3202d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, sc); 3212d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 3222d1661a5SPawel Jakub Dawidek wakeup(sc); 3232d1661a5SPawel Jakub Dawidek wakeup(&sc->sc_queue); 3242d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 3252d1661a5SPawel Jakub Dawidek if ((flags & G_RAID3_EVENT_DONTWAIT) != 0) 3262d1661a5SPawel Jakub Dawidek return (0); 3273650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 3282d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Sleeping %p.", __func__, ep); 3293650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 3302d1661a5SPawel Jakub Dawidek while ((ep->e_flags & G_RAID3_EVENT_DONE) == 0) { 3312d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 3322d1661a5SPawel Jakub Dawidek MSLEEP(ep, &sc->sc_events_mtx, PRIBIO | PDROP, "r3:event", 3332d1661a5SPawel Jakub Dawidek hz * 5); 3342d1661a5SPawel Jakub Dawidek } 3352d1661a5SPawel Jakub Dawidek error = ep->e_error; 3362d1661a5SPawel Jakub Dawidek g_raid3_event_free(ep); 3373650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 3382d1661a5SPawel Jakub Dawidek return (error); 3392d1661a5SPawel Jakub Dawidek } 3402d1661a5SPawel Jakub Dawidek 3412d1661a5SPawel Jakub Dawidek static struct g_raid3_event * 3422d1661a5SPawel Jakub Dawidek g_raid3_event_get(struct g_raid3_softc *sc) 3432d1661a5SPawel Jakub Dawidek { 3442d1661a5SPawel Jakub Dawidek struct g_raid3_event *ep; 3452d1661a5SPawel Jakub Dawidek 3462d1661a5SPawel Jakub Dawidek 
mtx_lock(&sc->sc_events_mtx); 3472d1661a5SPawel Jakub Dawidek ep = TAILQ_FIRST(&sc->sc_events); 3482d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_events_mtx); 3492d1661a5SPawel Jakub Dawidek return (ep); 3502d1661a5SPawel Jakub Dawidek } 3512d1661a5SPawel Jakub Dawidek 3522d1661a5SPawel Jakub Dawidek static void 353d97d5ee9SPawel Jakub Dawidek g_raid3_event_remove(struct g_raid3_softc *sc, struct g_raid3_event *ep) 354d97d5ee9SPawel Jakub Dawidek { 355d97d5ee9SPawel Jakub Dawidek 356d97d5ee9SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 357d97d5ee9SPawel Jakub Dawidek TAILQ_REMOVE(&sc->sc_events, ep, e_next); 358d97d5ee9SPawel Jakub Dawidek mtx_unlock(&sc->sc_events_mtx); 359d97d5ee9SPawel Jakub Dawidek } 360d97d5ee9SPawel Jakub Dawidek 361d97d5ee9SPawel Jakub Dawidek static void 3622d1661a5SPawel Jakub Dawidek g_raid3_event_cancel(struct g_raid3_disk *disk) 3632d1661a5SPawel Jakub Dawidek { 3642d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 3652d1661a5SPawel Jakub Dawidek struct g_raid3_event *ep, *tmpep; 3662d1661a5SPawel Jakub Dawidek 3672d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 3683650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 3693650be51SPawel Jakub Dawidek 3702d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 3712d1661a5SPawel Jakub Dawidek TAILQ_FOREACH_SAFE(ep, &sc->sc_events, e_next, tmpep) { 3722d1661a5SPawel Jakub Dawidek if ((ep->e_flags & G_RAID3_EVENT_DEVICE) != 0) 3732d1661a5SPawel Jakub Dawidek continue; 3742d1661a5SPawel Jakub Dawidek if (ep->e_disk != disk) 3752d1661a5SPawel Jakub Dawidek continue; 3762d1661a5SPawel Jakub Dawidek TAILQ_REMOVE(&sc->sc_events, ep, e_next); 3772d1661a5SPawel Jakub Dawidek if ((ep->e_flags & G_RAID3_EVENT_DONTWAIT) != 0) 3782d1661a5SPawel Jakub Dawidek g_raid3_event_free(ep); 3792d1661a5SPawel Jakub Dawidek else { 3802d1661a5SPawel Jakub Dawidek ep->e_error = ECANCELED; 3812d1661a5SPawel Jakub Dawidek wakeup(ep); 3822d1661a5SPawel Jakub Dawidek } 3832d1661a5SPawel Jakub 
Dawidek } 3842d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_events_mtx); 3852d1661a5SPawel Jakub Dawidek } 3862d1661a5SPawel Jakub Dawidek 3872d1661a5SPawel Jakub Dawidek /* 3882d1661a5SPawel Jakub Dawidek * Return the number of disks in the given state. 3892d1661a5SPawel Jakub Dawidek * If state is equal to -1, count all connected disks. 3902d1661a5SPawel Jakub Dawidek */ 3912d1661a5SPawel Jakub Dawidek u_int 3922d1661a5SPawel Jakub Dawidek g_raid3_ndisks(struct g_raid3_softc *sc, int state) 3932d1661a5SPawel Jakub Dawidek { 3942d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 395fa6a7837SDavid E. O'Brien u_int n, ndisks; 3962d1661a5SPawel Jakub Dawidek 3973650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_LOCKED); 3983650be51SPawel Jakub Dawidek 399fa6a7837SDavid E. O'Brien for (n = ndisks = 0; n < sc->sc_ndisks; n++) { 4002d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 4012d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NODISK) 4022d1661a5SPawel Jakub Dawidek continue; 4032d1661a5SPawel Jakub Dawidek if (state == -1 || disk->d_state == state) 4042d1661a5SPawel Jakub Dawidek ndisks++; 4052d1661a5SPawel Jakub Dawidek } 4062d1661a5SPawel Jakub Dawidek return (ndisks); 4072d1661a5SPawel Jakub Dawidek } 4082d1661a5SPawel Jakub Dawidek 4092d1661a5SPawel Jakub Dawidek static u_int 4102d1661a5SPawel Jakub Dawidek g_raid3_nrequests(struct g_raid3_softc *sc, struct g_consumer *cp) 4112d1661a5SPawel Jakub Dawidek { 4122d1661a5SPawel Jakub Dawidek struct bio *bp; 4132d1661a5SPawel Jakub Dawidek u_int nreqs = 0; 4142d1661a5SPawel Jakub Dawidek 4152d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 4162d1661a5SPawel Jakub Dawidek TAILQ_FOREACH(bp, &sc->sc_queue.queue, bio_queue) { 4172d1661a5SPawel Jakub Dawidek if (bp->bio_from == cp) 4182d1661a5SPawel Jakub Dawidek nreqs++; 4192d1661a5SPawel Jakub Dawidek } 4202d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 4212d1661a5SPawel Jakub Dawidek return (nreqs); 
4222d1661a5SPawel Jakub Dawidek } 4232d1661a5SPawel Jakub Dawidek 4242d1661a5SPawel Jakub Dawidek static int 4252d1661a5SPawel Jakub Dawidek g_raid3_is_busy(struct g_raid3_softc *sc, struct g_consumer *cp) 4262d1661a5SPawel Jakub Dawidek { 4272d1661a5SPawel Jakub Dawidek 42879e61493SPawel Jakub Dawidek if (cp->index > 0) { 4292d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, 4302d1661a5SPawel Jakub Dawidek "I/O requests for %s exist, can't destroy it now.", 4312d1661a5SPawel Jakub Dawidek cp->provider->name); 4322d1661a5SPawel Jakub Dawidek return (1); 4332d1661a5SPawel Jakub Dawidek } 4342d1661a5SPawel Jakub Dawidek if (g_raid3_nrequests(sc, cp) > 0) { 4352d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, 4362d1661a5SPawel Jakub Dawidek "I/O requests for %s in queue, can't destroy it now.", 4372d1661a5SPawel Jakub Dawidek cp->provider->name); 4382d1661a5SPawel Jakub Dawidek return (1); 4392d1661a5SPawel Jakub Dawidek } 4402d1661a5SPawel Jakub Dawidek return (0); 4412d1661a5SPawel Jakub Dawidek } 4422d1661a5SPawel Jakub Dawidek 4432d1661a5SPawel Jakub Dawidek static void 444d97d5ee9SPawel Jakub Dawidek g_raid3_destroy_consumer(void *arg, int flags __unused) 445d97d5ee9SPawel Jakub Dawidek { 446d97d5ee9SPawel Jakub Dawidek struct g_consumer *cp; 447d97d5ee9SPawel Jakub Dawidek 4483650be51SPawel Jakub Dawidek g_topology_assert(); 4493650be51SPawel Jakub Dawidek 450d97d5ee9SPawel Jakub Dawidek cp = arg; 451d97d5ee9SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Consumer %s destroyed.", cp->provider->name); 452d97d5ee9SPawel Jakub Dawidek g_detach(cp); 453d97d5ee9SPawel Jakub Dawidek g_destroy_consumer(cp); 454d97d5ee9SPawel Jakub Dawidek } 455d97d5ee9SPawel Jakub Dawidek 456d97d5ee9SPawel Jakub Dawidek static void 4572d1661a5SPawel Jakub Dawidek g_raid3_kill_consumer(struct g_raid3_softc *sc, struct g_consumer *cp) 4582d1661a5SPawel Jakub Dawidek { 459d97d5ee9SPawel Jakub Dawidek struct g_provider *pp; 460d97d5ee9SPawel Jakub Dawidek int retaste_wait; 4612d1661a5SPawel Jakub Dawidek 
4622d1661a5SPawel Jakub Dawidek g_topology_assert(); 4632d1661a5SPawel Jakub Dawidek 4642d1661a5SPawel Jakub Dawidek cp->private = NULL; 4652d1661a5SPawel Jakub Dawidek if (g_raid3_is_busy(sc, cp)) 4662d1661a5SPawel Jakub Dawidek return; 4672d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Consumer %s destroyed.", cp->provider->name); 468d97d5ee9SPawel Jakub Dawidek pp = cp->provider; 469d97d5ee9SPawel Jakub Dawidek retaste_wait = 0; 470d97d5ee9SPawel Jakub Dawidek if (cp->acw == 1) { 471d97d5ee9SPawel Jakub Dawidek if ((pp->geom->flags & G_GEOM_WITHER) == 0) 472d97d5ee9SPawel Jakub Dawidek retaste_wait = 1; 473d97d5ee9SPawel Jakub Dawidek } 474d97d5ee9SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Access %s r%dw%de%d = %d", pp->name, -cp->acr, 475d97d5ee9SPawel Jakub Dawidek -cp->acw, -cp->ace, 0); 476d97d5ee9SPawel Jakub Dawidek if (cp->acr > 0 || cp->acw > 0 || cp->ace > 0) 477d97d5ee9SPawel Jakub Dawidek g_access(cp, -cp->acr, -cp->acw, -cp->ace); 478d97d5ee9SPawel Jakub Dawidek if (retaste_wait) { 479d97d5ee9SPawel Jakub Dawidek /* 480d97d5ee9SPawel Jakub Dawidek * After retaste event was send (inside g_access()), we can send 481d97d5ee9SPawel Jakub Dawidek * event to detach and destroy consumer. 482d97d5ee9SPawel Jakub Dawidek * A class, which has consumer to the given provider connected 483d97d5ee9SPawel Jakub Dawidek * will not receive retaste event for the provider. 484d97d5ee9SPawel Jakub Dawidek * This is the way how I ignore retaste events when I close 485d97d5ee9SPawel Jakub Dawidek * consumers opened for write: I detach and destroy consumer 486d97d5ee9SPawel Jakub Dawidek * after retaste event is sent. 
487d97d5ee9SPawel Jakub Dawidek */ 488d97d5ee9SPawel Jakub Dawidek g_post_event(g_raid3_destroy_consumer, cp, M_WAITOK, NULL); 489d97d5ee9SPawel Jakub Dawidek return; 490d97d5ee9SPawel Jakub Dawidek } 491d97d5ee9SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Consumer %s destroyed.", pp->name); 4922d1661a5SPawel Jakub Dawidek g_detach(cp); 4932d1661a5SPawel Jakub Dawidek g_destroy_consumer(cp); 4942d1661a5SPawel Jakub Dawidek } 4952d1661a5SPawel Jakub Dawidek 4962d1661a5SPawel Jakub Dawidek static int 4972d1661a5SPawel Jakub Dawidek g_raid3_connect_disk(struct g_raid3_disk *disk, struct g_provider *pp) 4982d1661a5SPawel Jakub Dawidek { 49934cb1517SPawel Jakub Dawidek struct g_consumer *cp; 5002d1661a5SPawel Jakub Dawidek int error; 5012d1661a5SPawel Jakub Dawidek 5023650be51SPawel Jakub Dawidek g_topology_assert_not(); 5032d1661a5SPawel Jakub Dawidek KASSERT(disk->d_consumer == NULL, 5042d1661a5SPawel Jakub Dawidek ("Disk already connected (device %s).", disk->d_softc->sc_name)); 5052d1661a5SPawel Jakub Dawidek 5063650be51SPawel Jakub Dawidek g_topology_lock(); 50734cb1517SPawel Jakub Dawidek cp = g_new_consumer(disk->d_softc->sc_geom); 50834cb1517SPawel Jakub Dawidek error = g_attach(cp, pp); 509d97d5ee9SPawel Jakub Dawidek if (error != 0) { 51034cb1517SPawel Jakub Dawidek g_destroy_consumer(cp); 5113650be51SPawel Jakub Dawidek g_topology_unlock(); 51234cb1517SPawel Jakub Dawidek return (error); 51334cb1517SPawel Jakub Dawidek } 51434cb1517SPawel Jakub Dawidek error = g_access(cp, 1, 1, 1); 5153650be51SPawel Jakub Dawidek g_topology_unlock(); 51634cb1517SPawel Jakub Dawidek if (error != 0) { 51734cb1517SPawel Jakub Dawidek g_detach(cp); 51834cb1517SPawel Jakub Dawidek g_destroy_consumer(cp); 519d97d5ee9SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Cannot open consumer %s (error=%d).", 520d97d5ee9SPawel Jakub Dawidek pp->name, error); 521d97d5ee9SPawel Jakub Dawidek return (error); 522d97d5ee9SPawel Jakub Dawidek } 52334cb1517SPawel Jakub Dawidek disk->d_consumer = cp; 
52434cb1517SPawel Jakub Dawidek disk->d_consumer->private = disk; 52534cb1517SPawel Jakub Dawidek disk->d_consumer->index = 0; 5262d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Disk %s connected.", g_raid3_get_diskname(disk)); 5272d1661a5SPawel Jakub Dawidek return (0); 5282d1661a5SPawel Jakub Dawidek } 5292d1661a5SPawel Jakub Dawidek 5302d1661a5SPawel Jakub Dawidek static void 5312d1661a5SPawel Jakub Dawidek g_raid3_disconnect_consumer(struct g_raid3_softc *sc, struct g_consumer *cp) 5322d1661a5SPawel Jakub Dawidek { 5332d1661a5SPawel Jakub Dawidek 5342d1661a5SPawel Jakub Dawidek g_topology_assert(); 5352d1661a5SPawel Jakub Dawidek 5362d1661a5SPawel Jakub Dawidek if (cp == NULL) 5372d1661a5SPawel Jakub Dawidek return; 538d97d5ee9SPawel Jakub Dawidek if (cp->provider != NULL) 5392d1661a5SPawel Jakub Dawidek g_raid3_kill_consumer(sc, cp); 540d97d5ee9SPawel Jakub Dawidek else 5412d1661a5SPawel Jakub Dawidek g_destroy_consumer(cp); 5422d1661a5SPawel Jakub Dawidek } 5432d1661a5SPawel Jakub Dawidek 5442d1661a5SPawel Jakub Dawidek /* 5452d1661a5SPawel Jakub Dawidek * Initialize disk. This means allocate memory, create consumer, attach it 5462d1661a5SPawel Jakub Dawidek * to the provider and open access (r1w1e1) to it. 
5472d1661a5SPawel Jakub Dawidek */ 5482d1661a5SPawel Jakub Dawidek static struct g_raid3_disk * 5492d1661a5SPawel Jakub Dawidek g_raid3_init_disk(struct g_raid3_softc *sc, struct g_provider *pp, 5502d1661a5SPawel Jakub Dawidek struct g_raid3_metadata *md, int *errorp) 5512d1661a5SPawel Jakub Dawidek { 5522d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 5532d1661a5SPawel Jakub Dawidek int error; 5542d1661a5SPawel Jakub Dawidek 5552d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[md->md_no]; 5562d1661a5SPawel Jakub Dawidek error = g_raid3_connect_disk(disk, pp); 55734cb1517SPawel Jakub Dawidek if (error != 0) { 55834cb1517SPawel Jakub Dawidek if (errorp != NULL) 55934cb1517SPawel Jakub Dawidek *errorp = error; 56034cb1517SPawel Jakub Dawidek return (NULL); 56134cb1517SPawel Jakub Dawidek } 5622d1661a5SPawel Jakub Dawidek disk->d_state = G_RAID3_DISK_STATE_NONE; 5632d1661a5SPawel Jakub Dawidek disk->d_flags = md->md_dflags; 5642d1661a5SPawel Jakub Dawidek if (md->md_provider[0] != '\0') 5652d1661a5SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_HARDCODED; 5662d1661a5SPawel Jakub Dawidek disk->d_sync.ds_consumer = NULL; 5672d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset = md->md_sync_offset; 5682d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset_done = md->md_sync_offset; 569a245a548SPawel Jakub Dawidek disk->d_genid = md->md_genid; 5702d1661a5SPawel Jakub Dawidek disk->d_sync.ds_syncid = md->md_syncid; 5712d1661a5SPawel Jakub Dawidek if (errorp != NULL) 5722d1661a5SPawel Jakub Dawidek *errorp = 0; 5732d1661a5SPawel Jakub Dawidek return (disk); 5742d1661a5SPawel Jakub Dawidek } 5752d1661a5SPawel Jakub Dawidek 5762d1661a5SPawel Jakub Dawidek static void 5772d1661a5SPawel Jakub Dawidek g_raid3_destroy_disk(struct g_raid3_disk *disk) 5782d1661a5SPawel Jakub Dawidek { 5792d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 5802d1661a5SPawel Jakub Dawidek 5813650be51SPawel Jakub Dawidek g_topology_assert_not(); 5823650be51SPawel Jakub Dawidek sc = 
disk->d_softc; 5833650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 5842d1661a5SPawel Jakub Dawidek 5852d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NODISK) 5862d1661a5SPawel Jakub Dawidek return; 5872d1661a5SPawel Jakub Dawidek g_raid3_event_cancel(disk); 5882d1661a5SPawel Jakub Dawidek switch (disk->d_state) { 5892d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_SYNCHRONIZING: 5902d1661a5SPawel Jakub Dawidek if (sc->sc_syncdisk != NULL) 5912d1661a5SPawel Jakub Dawidek g_raid3_sync_stop(sc, 1); 5922d1661a5SPawel Jakub Dawidek /* FALLTHROUGH */ 5932d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_NEW: 5942d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_STALE: 5952d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_ACTIVE: 5963650be51SPawel Jakub Dawidek g_topology_lock(); 5972d1661a5SPawel Jakub Dawidek g_raid3_disconnect_consumer(sc, disk->d_consumer); 5983650be51SPawel Jakub Dawidek g_topology_unlock(); 5992d1661a5SPawel Jakub Dawidek disk->d_consumer = NULL; 6002d1661a5SPawel Jakub Dawidek break; 6012d1661a5SPawel Jakub Dawidek default: 6022d1661a5SPawel Jakub Dawidek KASSERT(0 == 1, ("Wrong disk state (%s, %s).", 6032d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 6042d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 6052d1661a5SPawel Jakub Dawidek } 6062d1661a5SPawel Jakub Dawidek disk->d_state = G_RAID3_DISK_STATE_NODISK; 6072d1661a5SPawel Jakub Dawidek } 6082d1661a5SPawel Jakub Dawidek 6092d1661a5SPawel Jakub Dawidek static void 6102d1661a5SPawel Jakub Dawidek g_raid3_destroy_device(struct g_raid3_softc *sc) 6112d1661a5SPawel Jakub Dawidek { 6122d1661a5SPawel Jakub Dawidek struct g_raid3_event *ep; 6139da3072cSPawel Jakub Dawidek struct g_raid3_disk *disk; 6142d1661a5SPawel Jakub Dawidek struct g_geom *gp; 6152d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 6162d1661a5SPawel Jakub Dawidek u_int n; 6172d1661a5SPawel Jakub Dawidek 6183650be51SPawel Jakub Dawidek 
g_topology_assert_not(); 6193650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 6202d1661a5SPawel Jakub Dawidek 6212d1661a5SPawel Jakub Dawidek gp = sc->sc_geom; 6222d1661a5SPawel Jakub Dawidek if (sc->sc_provider != NULL) 6232d1661a5SPawel Jakub Dawidek g_raid3_destroy_provider(sc); 6249da3072cSPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 6259da3072cSPawel Jakub Dawidek disk = &sc->sc_disks[n]; 626d97d5ee9SPawel Jakub Dawidek if (disk->d_state != G_RAID3_DISK_STATE_NODISK) { 6279da3072cSPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 6289da3072cSPawel Jakub Dawidek g_raid3_update_metadata(disk); 6299da3072cSPawel Jakub Dawidek g_raid3_destroy_disk(disk); 6309da3072cSPawel Jakub Dawidek } 631d97d5ee9SPawel Jakub Dawidek } 6322d1661a5SPawel Jakub Dawidek while ((ep = g_raid3_event_get(sc)) != NULL) { 633d97d5ee9SPawel Jakub Dawidek g_raid3_event_remove(sc, ep); 6342d1661a5SPawel Jakub Dawidek if ((ep->e_flags & G_RAID3_EVENT_DONTWAIT) != 0) 6352d1661a5SPawel Jakub Dawidek g_raid3_event_free(ep); 6362d1661a5SPawel Jakub Dawidek else { 6372d1661a5SPawel Jakub Dawidek ep->e_error = ECANCELED; 6382d1661a5SPawel Jakub Dawidek ep->e_flags |= G_RAID3_EVENT_DONE; 6392d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, ep); 6402d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 6412d1661a5SPawel Jakub Dawidek wakeup(ep); 6422d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_events_mtx); 6432d1661a5SPawel Jakub Dawidek } 6442d1661a5SPawel Jakub Dawidek } 6452d1661a5SPawel Jakub Dawidek callout_drain(&sc->sc_callout); 6462d1661a5SPawel Jakub Dawidek cp = LIST_FIRST(&sc->sc_sync.ds_geom->consumer); 6473650be51SPawel Jakub Dawidek g_topology_lock(); 6482d1661a5SPawel Jakub Dawidek if (cp != NULL) 6492d1661a5SPawel Jakub Dawidek g_raid3_disconnect_consumer(sc, cp); 6502d1661a5SPawel Jakub Dawidek g_wither_geom(sc->sc_sync.ds_geom, ENXIO); 6512d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s destroyed.", 
gp->name); 6522d1661a5SPawel Jakub Dawidek g_wither_geom(gp, ENXIO); 6533650be51SPawel Jakub Dawidek g_topology_unlock(); 654ed940a82SPawel Jakub Dawidek if (!g_raid3_use_malloc) { 6553650be51SPawel Jakub Dawidek uma_zdestroy(sc->sc_zones[G_RAID3_ZONE_64K].sz_zone); 6563650be51SPawel Jakub Dawidek uma_zdestroy(sc->sc_zones[G_RAID3_ZONE_16K].sz_zone); 6573650be51SPawel Jakub Dawidek uma_zdestroy(sc->sc_zones[G_RAID3_ZONE_4K].sz_zone); 658ed940a82SPawel Jakub Dawidek } 6593650be51SPawel Jakub Dawidek mtx_destroy(&sc->sc_queue_mtx); 6603650be51SPawel Jakub Dawidek mtx_destroy(&sc->sc_events_mtx); 6613650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 6623650be51SPawel Jakub Dawidek sx_destroy(&sc->sc_lock); 6632d1661a5SPawel Jakub Dawidek } 6642d1661a5SPawel Jakub Dawidek 6652d1661a5SPawel Jakub Dawidek static void 6662d1661a5SPawel Jakub Dawidek g_raid3_orphan(struct g_consumer *cp) 6672d1661a5SPawel Jakub Dawidek { 6682d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 6692d1661a5SPawel Jakub Dawidek 6702d1661a5SPawel Jakub Dawidek g_topology_assert(); 6712d1661a5SPawel Jakub Dawidek 6722d1661a5SPawel Jakub Dawidek disk = cp->private; 6732d1661a5SPawel Jakub Dawidek if (disk == NULL) 6742d1661a5SPawel Jakub Dawidek return; 675ea973705SPawel Jakub Dawidek disk->d_softc->sc_bump_id = G_RAID3_BUMP_SYNCID; 6762d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, G_RAID3_DISK_STATE_DISCONNECTED, 6772d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 6782d1661a5SPawel Jakub Dawidek } 6792d1661a5SPawel Jakub Dawidek 6802d1661a5SPawel Jakub Dawidek static int 6812d1661a5SPawel Jakub Dawidek g_raid3_write_metadata(struct g_raid3_disk *disk, struct g_raid3_metadata *md) 6822d1661a5SPawel Jakub Dawidek { 6832d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 6842d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 6852d1661a5SPawel Jakub Dawidek off_t offset, length; 6862d1661a5SPawel Jakub Dawidek u_char *sector; 687d97d5ee9SPawel Jakub Dawidek int error = 0; 
6882d1661a5SPawel Jakub Dawidek 6893650be51SPawel Jakub Dawidek g_topology_assert_not(); 6902d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 6913650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_LOCKED); 6923650be51SPawel Jakub Dawidek 6932d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 6942d1661a5SPawel Jakub Dawidek KASSERT(cp != NULL, ("NULL consumer (%s).", sc->sc_name)); 6952d1661a5SPawel Jakub Dawidek KASSERT(cp->provider != NULL, ("NULL provider (%s).", sc->sc_name)); 6963650be51SPawel Jakub Dawidek KASSERT(cp->acr >= 1 && cp->acw >= 1 && cp->ace >= 1, 697d97d5ee9SPawel Jakub Dawidek ("Consumer %s closed? (r%dw%de%d).", cp->provider->name, cp->acr, 698d97d5ee9SPawel Jakub Dawidek cp->acw, cp->ace)); 6992d1661a5SPawel Jakub Dawidek length = cp->provider->sectorsize; 7002d1661a5SPawel Jakub Dawidek offset = cp->provider->mediasize - length; 7012d1661a5SPawel Jakub Dawidek sector = malloc((size_t)length, M_RAID3, M_WAITOK | M_ZERO); 7022d1661a5SPawel Jakub Dawidek if (md != NULL) 7032d1661a5SPawel Jakub Dawidek raid3_metadata_encode(md, sector); 7042d1661a5SPawel Jakub Dawidek error = g_write_data(cp, offset, sector, length); 7052d1661a5SPawel Jakub Dawidek free(sector, M_RAID3); 7062d1661a5SPawel Jakub Dawidek if (error != 0) { 7073aae74ecSPawel Jakub Dawidek if ((disk->d_flags & G_RAID3_DISK_FLAG_BROKEN) == 0) { 7083aae74ecSPawel Jakub Dawidek G_RAID3_DEBUG(0, "Cannot write metadata on %s " 7093aae74ecSPawel Jakub Dawidek "(device=%s, error=%d).", 7103aae74ecSPawel Jakub Dawidek g_raid3_get_diskname(disk), sc->sc_name, error); 7113aae74ecSPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_BROKEN; 7123aae74ecSPawel Jakub Dawidek } else { 7133aae74ecSPawel Jakub Dawidek G_RAID3_DEBUG(1, "Cannot write metadata on %s " 7143aae74ecSPawel Jakub Dawidek "(device=%s, error=%d).", 7153aae74ecSPawel Jakub Dawidek g_raid3_get_diskname(disk), sc->sc_name, error); 7163aae74ecSPawel Jakub Dawidek } 7173aae74ecSPawel Jakub Dawidek if 
(g_raid3_disconnect_on_failure && 7183aae74ecSPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE) { 7193aae74ecSPawel Jakub Dawidek sc->sc_bump_id |= G_RAID3_BUMP_GENID; 7203aae74ecSPawel Jakub Dawidek g_raid3_event_send(disk, 7213aae74ecSPawel Jakub Dawidek G_RAID3_DISK_STATE_DISCONNECTED, 7222d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 7232d1661a5SPawel Jakub Dawidek } 7243aae74ecSPawel Jakub Dawidek } 7252d1661a5SPawel Jakub Dawidek return (error); 7262d1661a5SPawel Jakub Dawidek } 7272d1661a5SPawel Jakub Dawidek 7282d1661a5SPawel Jakub Dawidek int 7292d1661a5SPawel Jakub Dawidek g_raid3_clear_metadata(struct g_raid3_disk *disk) 7302d1661a5SPawel Jakub Dawidek { 7312d1661a5SPawel Jakub Dawidek int error; 7322d1661a5SPawel Jakub Dawidek 7333650be51SPawel Jakub Dawidek g_topology_assert_not(); 7343650be51SPawel Jakub Dawidek sx_assert(&disk->d_softc->sc_lock, SX_LOCKED); 7353650be51SPawel Jakub Dawidek 7362d1661a5SPawel Jakub Dawidek error = g_raid3_write_metadata(disk, NULL); 7372d1661a5SPawel Jakub Dawidek if (error == 0) { 7382d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Metadata on %s cleared.", 7392d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk)); 7402d1661a5SPawel Jakub Dawidek } else { 7412d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, 7422d1661a5SPawel Jakub Dawidek "Cannot clear metadata on disk %s (error=%d).", 7432d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), error); 7442d1661a5SPawel Jakub Dawidek } 7452d1661a5SPawel Jakub Dawidek return (error); 7462d1661a5SPawel Jakub Dawidek } 7472d1661a5SPawel Jakub Dawidek 7482d1661a5SPawel Jakub Dawidek void 7492d1661a5SPawel Jakub Dawidek g_raid3_fill_metadata(struct g_raid3_disk *disk, struct g_raid3_metadata *md) 7502d1661a5SPawel Jakub Dawidek { 7512d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 752e6890985SPawel Jakub Dawidek struct g_provider *pp; 7532d1661a5SPawel Jakub Dawidek 7542d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 7552d1661a5SPawel Jakub Dawidek 
strlcpy(md->md_magic, G_RAID3_MAGIC, sizeof(md->md_magic)); 7562d1661a5SPawel Jakub Dawidek md->md_version = G_RAID3_VERSION; 7572d1661a5SPawel Jakub Dawidek strlcpy(md->md_name, sc->sc_name, sizeof(md->md_name)); 7582d1661a5SPawel Jakub Dawidek md->md_id = sc->sc_id; 7592d1661a5SPawel Jakub Dawidek md->md_all = sc->sc_ndisks; 760a245a548SPawel Jakub Dawidek md->md_genid = sc->sc_genid; 7612d1661a5SPawel Jakub Dawidek md->md_mediasize = sc->sc_mediasize; 7622d1661a5SPawel Jakub Dawidek md->md_sectorsize = sc->sc_sectorsize; 7632d1661a5SPawel Jakub Dawidek md->md_mflags = (sc->sc_flags & G_RAID3_DEVICE_FLAG_MASK); 7642d1661a5SPawel Jakub Dawidek md->md_no = disk->d_no; 7652d1661a5SPawel Jakub Dawidek md->md_syncid = disk->d_sync.ds_syncid; 7662d1661a5SPawel Jakub Dawidek md->md_dflags = (disk->d_flags & G_RAID3_DISK_FLAG_MASK); 767c082905bSPawel Jakub Dawidek if (disk->d_state != G_RAID3_DISK_STATE_SYNCHRONIZING) 7682d1661a5SPawel Jakub Dawidek md->md_sync_offset = 0; 769c082905bSPawel Jakub Dawidek else { 770c082905bSPawel Jakub Dawidek md->md_sync_offset = 771c082905bSPawel Jakub Dawidek disk->d_sync.ds_offset_done / (sc->sc_ndisks - 1); 772c082905bSPawel Jakub Dawidek } 773e6890985SPawel Jakub Dawidek if (disk->d_consumer != NULL && disk->d_consumer->provider != NULL) 774e6890985SPawel Jakub Dawidek pp = disk->d_consumer->provider; 775e6890985SPawel Jakub Dawidek else 776e6890985SPawel Jakub Dawidek pp = NULL; 777e6890985SPawel Jakub Dawidek if ((disk->d_flags & G_RAID3_DISK_FLAG_HARDCODED) != 0 && pp != NULL) 778e6890985SPawel Jakub Dawidek strlcpy(md->md_provider, pp->name, sizeof(md->md_provider)); 779e6890985SPawel Jakub Dawidek else 7802d1661a5SPawel Jakub Dawidek bzero(md->md_provider, sizeof(md->md_provider)); 781e6890985SPawel Jakub Dawidek if (pp != NULL) 782e6890985SPawel Jakub Dawidek md->md_provsize = pp->mediasize; 783e6890985SPawel Jakub Dawidek else 784e6890985SPawel Jakub Dawidek md->md_provsize = 0; 7852d1661a5SPawel Jakub Dawidek } 
7862d1661a5SPawel Jakub Dawidek 7872d1661a5SPawel Jakub Dawidek void 7882d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(struct g_raid3_disk *disk) 7892d1661a5SPawel Jakub Dawidek { 7903650be51SPawel Jakub Dawidek struct g_raid3_softc *sc; 7912d1661a5SPawel Jakub Dawidek struct g_raid3_metadata md; 7922d1661a5SPawel Jakub Dawidek int error; 7932d1661a5SPawel Jakub Dawidek 7943650be51SPawel Jakub Dawidek g_topology_assert_not(); 7953650be51SPawel Jakub Dawidek sc = disk->d_softc; 7963650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_LOCKED); 7973650be51SPawel Jakub Dawidek 7982d1661a5SPawel Jakub Dawidek g_raid3_fill_metadata(disk, &md); 7992d1661a5SPawel Jakub Dawidek error = g_raid3_write_metadata(disk, &md); 8002d1661a5SPawel Jakub Dawidek if (error == 0) { 8012d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Metadata on %s updated.", 8022d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk)); 8032d1661a5SPawel Jakub Dawidek } else { 8042d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, 8052d1661a5SPawel Jakub Dawidek "Cannot update metadata on disk %s (error=%d).", 8062d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), error); 8072d1661a5SPawel Jakub Dawidek } 8082d1661a5SPawel Jakub Dawidek } 8092d1661a5SPawel Jakub Dawidek 8102d1661a5SPawel Jakub Dawidek static void 811d97d5ee9SPawel Jakub Dawidek g_raid3_bump_syncid(struct g_raid3_softc *sc) 8122d1661a5SPawel Jakub Dawidek { 8132d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 8142d1661a5SPawel Jakub Dawidek u_int n; 8152d1661a5SPawel Jakub Dawidek 8163650be51SPawel Jakub Dawidek g_topology_assert_not(); 8173650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 8182d1661a5SPawel Jakub Dawidek KASSERT(g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) > 0, 8192d1661a5SPawel Jakub Dawidek ("%s called with no active disks (device=%s).", __func__, 8202d1661a5SPawel Jakub Dawidek sc->sc_name)); 8212d1661a5SPawel Jakub Dawidek 8222d1661a5SPawel Jakub Dawidek sc->sc_syncid++; 823a245a548SPawel 
Jakub Dawidek G_RAID3_DEBUG(1, "Device %s: syncid bumped to %u.", sc->sc_name, 824a245a548SPawel Jakub Dawidek sc->sc_syncid); 8252d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 8262d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 8272d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_ACTIVE || 8282d1661a5SPawel Jakub Dawidek disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING) { 8292d1661a5SPawel Jakub Dawidek disk->d_sync.ds_syncid = sc->sc_syncid; 8302d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(disk); 8312d1661a5SPawel Jakub Dawidek } 8322d1661a5SPawel Jakub Dawidek } 8332d1661a5SPawel Jakub Dawidek } 8342d1661a5SPawel Jakub Dawidek 8354d006a98SPawel Jakub Dawidek static void 836a245a548SPawel Jakub Dawidek g_raid3_bump_genid(struct g_raid3_softc *sc) 837a245a548SPawel Jakub Dawidek { 838a245a548SPawel Jakub Dawidek struct g_raid3_disk *disk; 839a245a548SPawel Jakub Dawidek u_int n; 840a245a548SPawel Jakub Dawidek 8413650be51SPawel Jakub Dawidek g_topology_assert_not(); 8423650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 843a245a548SPawel Jakub Dawidek KASSERT(g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) > 0, 844a245a548SPawel Jakub Dawidek ("%s called with no active disks (device=%s).", __func__, 845a245a548SPawel Jakub Dawidek sc->sc_name)); 846a245a548SPawel Jakub Dawidek 847a245a548SPawel Jakub Dawidek sc->sc_genid++; 848a245a548SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Device %s: genid bumped to %u.", sc->sc_name, 849a245a548SPawel Jakub Dawidek sc->sc_genid); 850a245a548SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 851a245a548SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 852a245a548SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_ACTIVE || 853a245a548SPawel Jakub Dawidek disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING) { 854a245a548SPawel Jakub Dawidek disk->d_genid = sc->sc_genid; 855a245a548SPawel Jakub Dawidek g_raid3_update_metadata(disk); 856a245a548SPawel Jakub 
Dawidek } 857a245a548SPawel Jakub Dawidek } 858a245a548SPawel Jakub Dawidek } 859a245a548SPawel Jakub Dawidek 8600962f942SPawel Jakub Dawidek static int 8613650be51SPawel Jakub Dawidek g_raid3_idle(struct g_raid3_softc *sc, int acw) 8624d006a98SPawel Jakub Dawidek { 8634d006a98SPawel Jakub Dawidek struct g_raid3_disk *disk; 8644d006a98SPawel Jakub Dawidek u_int i; 8650962f942SPawel Jakub Dawidek int timeout; 8664d006a98SPawel Jakub Dawidek 8673650be51SPawel Jakub Dawidek g_topology_assert_not(); 8683650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 8693650be51SPawel Jakub Dawidek 8700962f942SPawel Jakub Dawidek if (sc->sc_provider == NULL) 8710962f942SPawel Jakub Dawidek return (0); 872501250baSPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_NOFAILSYNC) != 0) 873501250baSPawel Jakub Dawidek return (0); 8740962f942SPawel Jakub Dawidek if (sc->sc_idle) 8750962f942SPawel Jakub Dawidek return (0); 8760962f942SPawel Jakub Dawidek if (sc->sc_writes > 0) 8770962f942SPawel Jakub Dawidek return (0); 8783650be51SPawel Jakub Dawidek if (acw > 0 || (acw == -1 && sc->sc_provider->acw > 0)) { 87901f1f41cSPawel Jakub Dawidek timeout = g_raid3_idletime - (time_uptime - sc->sc_last_write); 880f62c1a47SAlexander Motin if (!g_raid3_shutdown && timeout > 0) 8810962f942SPawel Jakub Dawidek return (timeout); 8820962f942SPawel Jakub Dawidek } 8834d006a98SPawel Jakub Dawidek sc->sc_idle = 1; 8844d006a98SPawel Jakub Dawidek for (i = 0; i < sc->sc_ndisks; i++) { 8854d006a98SPawel Jakub Dawidek disk = &sc->sc_disks[i]; 8864d006a98SPawel Jakub Dawidek if (disk->d_state != G_RAID3_DISK_STATE_ACTIVE) 8874d006a98SPawel Jakub Dawidek continue; 8884d006a98SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Disk %s (device %s) marked as clean.", 8894d006a98SPawel Jakub Dawidek g_raid3_get_diskname(disk), sc->sc_name); 8904d006a98SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 8914d006a98SPawel Jakub Dawidek g_raid3_update_metadata(disk); 8924d006a98SPawel Jakub Dawidek 
} 8930962f942SPawel Jakub Dawidek return (0); 8944d006a98SPawel Jakub Dawidek } 8954d006a98SPawel Jakub Dawidek 8964d006a98SPawel Jakub Dawidek static void 8974d006a98SPawel Jakub Dawidek g_raid3_unidle(struct g_raid3_softc *sc) 8984d006a98SPawel Jakub Dawidek { 8994d006a98SPawel Jakub Dawidek struct g_raid3_disk *disk; 9004d006a98SPawel Jakub Dawidek u_int i; 9014d006a98SPawel Jakub Dawidek 9023650be51SPawel Jakub Dawidek g_topology_assert_not(); 9033650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 9043650be51SPawel Jakub Dawidek 905501250baSPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_NOFAILSYNC) != 0) 906501250baSPawel Jakub Dawidek return; 9074d006a98SPawel Jakub Dawidek sc->sc_idle = 0; 90801f1f41cSPawel Jakub Dawidek sc->sc_last_write = time_uptime; 9094d006a98SPawel Jakub Dawidek for (i = 0; i < sc->sc_ndisks; i++) { 9104d006a98SPawel Jakub Dawidek disk = &sc->sc_disks[i]; 9114d006a98SPawel Jakub Dawidek if (disk->d_state != G_RAID3_DISK_STATE_ACTIVE) 9124d006a98SPawel Jakub Dawidek continue; 9134d006a98SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Disk %s (device %s) marked as dirty.", 9144d006a98SPawel Jakub Dawidek g_raid3_get_diskname(disk), sc->sc_name); 9154d006a98SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_DIRTY; 9164d006a98SPawel Jakub Dawidek g_raid3_update_metadata(disk); 9174d006a98SPawel Jakub Dawidek } 9184d006a98SPawel Jakub Dawidek } 9194d006a98SPawel Jakub Dawidek 9202d1661a5SPawel Jakub Dawidek /* 9212d1661a5SPawel Jakub Dawidek * Treat bio_driver1 field in parent bio as list head and field bio_caller1 9222d1661a5SPawel Jakub Dawidek * in child bio as pointer to the next element on the list. 
9232d1661a5SPawel Jakub Dawidek */ 9242d1661a5SPawel Jakub Dawidek #define G_RAID3_HEAD_BIO(pbp) (pbp)->bio_driver1 9252d1661a5SPawel Jakub Dawidek 9262d1661a5SPawel Jakub Dawidek #define G_RAID3_NEXT_BIO(cbp) (cbp)->bio_caller1 9272d1661a5SPawel Jakub Dawidek 9282d1661a5SPawel Jakub Dawidek #define G_RAID3_FOREACH_BIO(pbp, bp) \ 9292d1661a5SPawel Jakub Dawidek for ((bp) = G_RAID3_HEAD_BIO(pbp); (bp) != NULL; \ 9302d1661a5SPawel Jakub Dawidek (bp) = G_RAID3_NEXT_BIO(bp)) 9312d1661a5SPawel Jakub Dawidek 9322d1661a5SPawel Jakub Dawidek #define G_RAID3_FOREACH_SAFE_BIO(pbp, bp, tmpbp) \ 9332d1661a5SPawel Jakub Dawidek for ((bp) = G_RAID3_HEAD_BIO(pbp); \ 9342d1661a5SPawel Jakub Dawidek (bp) != NULL && ((tmpbp) = G_RAID3_NEXT_BIO(bp), 1); \ 9352d1661a5SPawel Jakub Dawidek (bp) = (tmpbp)) 9362d1661a5SPawel Jakub Dawidek 9372d1661a5SPawel Jakub Dawidek static void 9382d1661a5SPawel Jakub Dawidek g_raid3_init_bio(struct bio *pbp) 9392d1661a5SPawel Jakub Dawidek { 9402d1661a5SPawel Jakub Dawidek 9412d1661a5SPawel Jakub Dawidek G_RAID3_HEAD_BIO(pbp) = NULL; 9422d1661a5SPawel Jakub Dawidek } 9432d1661a5SPawel Jakub Dawidek 9442d1661a5SPawel Jakub Dawidek static void 945dba915cfSPawel Jakub Dawidek g_raid3_remove_bio(struct bio *cbp) 946dba915cfSPawel Jakub Dawidek { 947dba915cfSPawel Jakub Dawidek struct bio *pbp, *bp; 948dba915cfSPawel Jakub Dawidek 949dba915cfSPawel Jakub Dawidek pbp = cbp->bio_parent; 950dba915cfSPawel Jakub Dawidek if (G_RAID3_HEAD_BIO(pbp) == cbp) 951dba915cfSPawel Jakub Dawidek G_RAID3_HEAD_BIO(pbp) = G_RAID3_NEXT_BIO(cbp); 952dba915cfSPawel Jakub Dawidek else { 953dba915cfSPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, bp) { 954dba915cfSPawel Jakub Dawidek if (G_RAID3_NEXT_BIO(bp) == cbp) { 955dba915cfSPawel Jakub Dawidek G_RAID3_NEXT_BIO(bp) = G_RAID3_NEXT_BIO(cbp); 956dba915cfSPawel Jakub Dawidek break; 957dba915cfSPawel Jakub Dawidek } 958dba915cfSPawel Jakub Dawidek } 959dba915cfSPawel Jakub Dawidek } 960dba915cfSPawel Jakub Dawidek 
G_RAID3_NEXT_BIO(cbp) = NULL; 961dba915cfSPawel Jakub Dawidek } 962dba915cfSPawel Jakub Dawidek 963dba915cfSPawel Jakub Dawidek static void 964dba915cfSPawel Jakub Dawidek g_raid3_replace_bio(struct bio *sbp, struct bio *dbp) 965dba915cfSPawel Jakub Dawidek { 966dba915cfSPawel Jakub Dawidek struct bio *pbp, *bp; 967dba915cfSPawel Jakub Dawidek 968dba915cfSPawel Jakub Dawidek g_raid3_remove_bio(sbp); 969dba915cfSPawel Jakub Dawidek pbp = dbp->bio_parent; 970dba915cfSPawel Jakub Dawidek G_RAID3_NEXT_BIO(sbp) = G_RAID3_NEXT_BIO(dbp); 971dba915cfSPawel Jakub Dawidek if (G_RAID3_HEAD_BIO(pbp) == dbp) 972dba915cfSPawel Jakub Dawidek G_RAID3_HEAD_BIO(pbp) = sbp; 973dba915cfSPawel Jakub Dawidek else { 974dba915cfSPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, bp) { 975dba915cfSPawel Jakub Dawidek if (G_RAID3_NEXT_BIO(bp) == dbp) { 976dba915cfSPawel Jakub Dawidek G_RAID3_NEXT_BIO(bp) = sbp; 977dba915cfSPawel Jakub Dawidek break; 978dba915cfSPawel Jakub Dawidek } 979dba915cfSPawel Jakub Dawidek } 980dba915cfSPawel Jakub Dawidek } 981dba915cfSPawel Jakub Dawidek G_RAID3_NEXT_BIO(dbp) = NULL; 982dba915cfSPawel Jakub Dawidek } 983dba915cfSPawel Jakub Dawidek 984dba915cfSPawel Jakub Dawidek static void 9852d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(struct g_raid3_softc *sc, struct bio *cbp) 9862d1661a5SPawel Jakub Dawidek { 9872d1661a5SPawel Jakub Dawidek struct bio *bp, *pbp; 9882d1661a5SPawel Jakub Dawidek size_t size; 9892d1661a5SPawel Jakub Dawidek 9902d1661a5SPawel Jakub Dawidek pbp = cbp->bio_parent; 9912d1661a5SPawel Jakub Dawidek pbp->bio_children--; 9922d1661a5SPawel Jakub Dawidek KASSERT(cbp->bio_data != NULL, ("NULL bio_data")); 9932d1661a5SPawel Jakub Dawidek size = pbp->bio_length / (sc->sc_ndisks - 1); 994ed940a82SPawel Jakub Dawidek g_raid3_free(sc, cbp->bio_data, size); 9952d1661a5SPawel Jakub Dawidek if (G_RAID3_HEAD_BIO(pbp) == cbp) { 9962d1661a5SPawel Jakub Dawidek G_RAID3_HEAD_BIO(pbp) = G_RAID3_NEXT_BIO(cbp); 9972d1661a5SPawel Jakub Dawidek 
G_RAID3_NEXT_BIO(cbp) = NULL; 9982d1661a5SPawel Jakub Dawidek g_destroy_bio(cbp); 9992d1661a5SPawel Jakub Dawidek } else { 10002d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, bp) { 10012d1661a5SPawel Jakub Dawidek if (G_RAID3_NEXT_BIO(bp) == cbp) 10022d1661a5SPawel Jakub Dawidek break; 10032d1661a5SPawel Jakub Dawidek } 1004dba915cfSPawel Jakub Dawidek if (bp != NULL) { 1005dba915cfSPawel Jakub Dawidek KASSERT(G_RAID3_NEXT_BIO(bp) != NULL, 1006dba915cfSPawel Jakub Dawidek ("NULL bp->bio_driver1")); 10072d1661a5SPawel Jakub Dawidek G_RAID3_NEXT_BIO(bp) = G_RAID3_NEXT_BIO(cbp); 10082d1661a5SPawel Jakub Dawidek G_RAID3_NEXT_BIO(cbp) = NULL; 1009dba915cfSPawel Jakub Dawidek } 10102d1661a5SPawel Jakub Dawidek g_destroy_bio(cbp); 10112d1661a5SPawel Jakub Dawidek } 10122d1661a5SPawel Jakub Dawidek } 10132d1661a5SPawel Jakub Dawidek 10142d1661a5SPawel Jakub Dawidek static struct bio * 10152d1661a5SPawel Jakub Dawidek g_raid3_clone_bio(struct g_raid3_softc *sc, struct bio *pbp) 10162d1661a5SPawel Jakub Dawidek { 10172d1661a5SPawel Jakub Dawidek struct bio *bp, *cbp; 10182d1661a5SPawel Jakub Dawidek size_t size; 10193650be51SPawel Jakub Dawidek int memflag; 10202d1661a5SPawel Jakub Dawidek 10212d1661a5SPawel Jakub Dawidek cbp = g_clone_bio(pbp); 10222d1661a5SPawel Jakub Dawidek if (cbp == NULL) 10232d1661a5SPawel Jakub Dawidek return (NULL); 10242d1661a5SPawel Jakub Dawidek size = pbp->bio_length / (sc->sc_ndisks - 1); 10253650be51SPawel Jakub Dawidek if ((pbp->bio_cflags & G_RAID3_BIO_CFLAG_REGULAR) != 0) 10263650be51SPawel Jakub Dawidek memflag = M_WAITOK; 10272d1661a5SPawel Jakub Dawidek else 10283650be51SPawel Jakub Dawidek memflag = M_NOWAIT; 1029ed940a82SPawel Jakub Dawidek cbp->bio_data = g_raid3_alloc(sc, size, memflag); 10303650be51SPawel Jakub Dawidek if (cbp->bio_data == NULL) { 10312d1661a5SPawel Jakub Dawidek pbp->bio_children--; 10322d1661a5SPawel Jakub Dawidek g_destroy_bio(cbp); 10332d1661a5SPawel Jakub Dawidek return (NULL); 10342d1661a5SPawel Jakub 
Dawidek } 10352d1661a5SPawel Jakub Dawidek G_RAID3_NEXT_BIO(cbp) = NULL; 10362d1661a5SPawel Jakub Dawidek if (G_RAID3_HEAD_BIO(pbp) == NULL) 10372d1661a5SPawel Jakub Dawidek G_RAID3_HEAD_BIO(pbp) = cbp; 10382d1661a5SPawel Jakub Dawidek else { 10392d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, bp) { 10402d1661a5SPawel Jakub Dawidek if (G_RAID3_NEXT_BIO(bp) == NULL) { 10412d1661a5SPawel Jakub Dawidek G_RAID3_NEXT_BIO(bp) = cbp; 10422d1661a5SPawel Jakub Dawidek break; 10432d1661a5SPawel Jakub Dawidek } 10442d1661a5SPawel Jakub Dawidek } 10452d1661a5SPawel Jakub Dawidek } 10462d1661a5SPawel Jakub Dawidek return (cbp); 10472d1661a5SPawel Jakub Dawidek } 10482d1661a5SPawel Jakub Dawidek 10492d1661a5SPawel Jakub Dawidek static void 10502d1661a5SPawel Jakub Dawidek g_raid3_scatter(struct bio *pbp) 10512d1661a5SPawel Jakub Dawidek { 10522d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 10532d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 1054ee40c7aaSPawel Jakub Dawidek struct bio *bp, *cbp, *tmpbp; 10552d1661a5SPawel Jakub Dawidek off_t atom, cadd, padd, left; 105606b215fdSAlexander Motin int first; 10572d1661a5SPawel Jakub Dawidek 10582d1661a5SPawel Jakub Dawidek sc = pbp->bio_to->geom->softc; 10592d1661a5SPawel Jakub Dawidek bp = NULL; 10602d1661a5SPawel Jakub Dawidek if ((pbp->bio_pflags & G_RAID3_BIO_PFLAG_NOPARITY) == 0) { 10612d1661a5SPawel Jakub Dawidek /* 10622d1661a5SPawel Jakub Dawidek * Find bio for which we should calculate data. 
10632d1661a5SPawel Jakub Dawidek */ 10642d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 10652d1661a5SPawel Jakub Dawidek if ((cbp->bio_cflags & G_RAID3_BIO_CFLAG_PARITY) != 0) { 10662d1661a5SPawel Jakub Dawidek bp = cbp; 10672d1661a5SPawel Jakub Dawidek break; 10682d1661a5SPawel Jakub Dawidek } 10692d1661a5SPawel Jakub Dawidek } 10702d1661a5SPawel Jakub Dawidek KASSERT(bp != NULL, ("NULL parity bio.")); 10712d1661a5SPawel Jakub Dawidek } 10722d1661a5SPawel Jakub Dawidek atom = sc->sc_sectorsize / (sc->sc_ndisks - 1); 10732d1661a5SPawel Jakub Dawidek cadd = padd = 0; 10742d1661a5SPawel Jakub Dawidek for (left = pbp->bio_length; left > 0; left -= sc->sc_sectorsize) { 10752d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 10762d1661a5SPawel Jakub Dawidek if (cbp == bp) 10772d1661a5SPawel Jakub Dawidek continue; 10782d1661a5SPawel Jakub Dawidek bcopy(pbp->bio_data + padd, cbp->bio_data + cadd, atom); 10792d1661a5SPawel Jakub Dawidek padd += atom; 10802d1661a5SPawel Jakub Dawidek } 10812d1661a5SPawel Jakub Dawidek cadd += atom; 10822d1661a5SPawel Jakub Dawidek } 10832d1661a5SPawel Jakub Dawidek if ((pbp->bio_pflags & G_RAID3_BIO_PFLAG_NOPARITY) == 0) { 10842d1661a5SPawel Jakub Dawidek /* 10852d1661a5SPawel Jakub Dawidek * Calculate parity. 
10862d1661a5SPawel Jakub Dawidek */ 108706b215fdSAlexander Motin first = 1; 10882d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_SAFE_BIO(pbp, cbp, tmpbp) { 10892d1661a5SPawel Jakub Dawidek if (cbp == bp) 10902d1661a5SPawel Jakub Dawidek continue; 109106b215fdSAlexander Motin if (first) { 109206b215fdSAlexander Motin bcopy(cbp->bio_data, bp->bio_data, 10932d1661a5SPawel Jakub Dawidek bp->bio_length); 109406b215fdSAlexander Motin first = 0; 109506b215fdSAlexander Motin } else { 109606b215fdSAlexander Motin g_raid3_xor(cbp->bio_data, bp->bio_data, 109706b215fdSAlexander Motin bp->bio_length); 109806b215fdSAlexander Motin } 10992d1661a5SPawel Jakub Dawidek if ((cbp->bio_cflags & G_RAID3_BIO_CFLAG_NODISK) != 0) 11002d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 11012d1661a5SPawel Jakub Dawidek } 11022d1661a5SPawel Jakub Dawidek } 1103ee40c7aaSPawel Jakub Dawidek G_RAID3_FOREACH_SAFE_BIO(pbp, cbp, tmpbp) { 11042d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 11052d1661a5SPawel Jakub Dawidek 11062d1661a5SPawel Jakub Dawidek disk = cbp->bio_caller2; 11072d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 11082d1661a5SPawel Jakub Dawidek cbp->bio_to = cp->provider; 11092d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, cbp, "Sending request."); 11103650be51SPawel Jakub Dawidek KASSERT(cp->acr >= 1 && cp->acw >= 1 && cp->ace >= 1, 1111d97d5ee9SPawel Jakub Dawidek ("Consumer %s not opened (r%dw%de%d).", cp->provider->name, 1112d97d5ee9SPawel Jakub Dawidek cp->acr, cp->acw, cp->ace)); 111379e61493SPawel Jakub Dawidek cp->index++; 11140962f942SPawel Jakub Dawidek sc->sc_writes++; 11152d1661a5SPawel Jakub Dawidek g_io_request(cbp, cp); 11162d1661a5SPawel Jakub Dawidek } 11172d1661a5SPawel Jakub Dawidek } 11182d1661a5SPawel Jakub Dawidek 11192d1661a5SPawel Jakub Dawidek static void 11202d1661a5SPawel Jakub Dawidek g_raid3_gather(struct bio *pbp) 11212d1661a5SPawel Jakub Dawidek { 11222d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 11232d1661a5SPawel Jakub Dawidek 
struct g_raid3_disk *disk; 1124f5a2f7feSPawel Jakub Dawidek struct bio *xbp, *fbp, *cbp; 11252d1661a5SPawel Jakub Dawidek off_t atom, cadd, padd, left; 11262d1661a5SPawel Jakub Dawidek 11272d1661a5SPawel Jakub Dawidek sc = pbp->bio_to->geom->softc; 11282d1661a5SPawel Jakub Dawidek /* 1129f5a2f7feSPawel Jakub Dawidek * Find bio for which we have to calculate data. 11302d1661a5SPawel Jakub Dawidek * While going through this path, check if all requests 11312d1661a5SPawel Jakub Dawidek * succeeded, if not, deny whole request. 1132f5a2f7feSPawel Jakub Dawidek * If we're in COMPLETE mode, we allow one request to fail, 1133f5a2f7feSPawel Jakub Dawidek * so if we find one, we're sending it to the parity consumer. 1134f5a2f7feSPawel Jakub Dawidek * If there are more failed requests, we deny whole request. 11352d1661a5SPawel Jakub Dawidek */ 1136f5a2f7feSPawel Jakub Dawidek xbp = fbp = NULL; 11372d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 11382d1661a5SPawel Jakub Dawidek if ((cbp->bio_cflags & G_RAID3_BIO_CFLAG_PARITY) != 0) { 1139f5a2f7feSPawel Jakub Dawidek KASSERT(xbp == NULL, ("More than one parity bio.")); 1140f5a2f7feSPawel Jakub Dawidek xbp = cbp; 11412d1661a5SPawel Jakub Dawidek } 11422d1661a5SPawel Jakub Dawidek if (cbp->bio_error == 0) 11432d1661a5SPawel Jakub Dawidek continue; 11442d1661a5SPawel Jakub Dawidek /* 11452d1661a5SPawel Jakub Dawidek * Found failed request. 11462d1661a5SPawel Jakub Dawidek */ 1147f5a2f7feSPawel Jakub Dawidek if (fbp == NULL) { 1148f5a2f7feSPawel Jakub Dawidek if ((pbp->bio_pflags & G_RAID3_BIO_PFLAG_DEGRADED) != 0) { 11492d1661a5SPawel Jakub Dawidek /* 1150f5a2f7feSPawel Jakub Dawidek * We are already in degraded mode, so we can't 1151f5a2f7feSPawel Jakub Dawidek * accept any failures. 
11522d1661a5SPawel Jakub Dawidek */ 1153f5a2f7feSPawel Jakub Dawidek if (pbp->bio_error == 0) 115417fec17eSPawel Jakub Dawidek pbp->bio_error = cbp->bio_error; 11552d1661a5SPawel Jakub Dawidek } else { 1156f5a2f7feSPawel Jakub Dawidek fbp = cbp; 11572d1661a5SPawel Jakub Dawidek } 1158f5a2f7feSPawel Jakub Dawidek } else { 11592d1661a5SPawel Jakub Dawidek /* 11602d1661a5SPawel Jakub Dawidek * Next failed request, that's too many. 11612d1661a5SPawel Jakub Dawidek */ 11622d1661a5SPawel Jakub Dawidek if (pbp->bio_error == 0) 1163f5a2f7feSPawel Jakub Dawidek pbp->bio_error = fbp->bio_error; 11642d1661a5SPawel Jakub Dawidek } 11653aae74ecSPawel Jakub Dawidek disk = cbp->bio_caller2; 11663aae74ecSPawel Jakub Dawidek if (disk == NULL) 11673aae74ecSPawel Jakub Dawidek continue; 11683aae74ecSPawel Jakub Dawidek if ((disk->d_flags & G_RAID3_DISK_FLAG_BROKEN) == 0) { 11693aae74ecSPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_BROKEN; 11703aae74ecSPawel Jakub Dawidek G_RAID3_LOGREQ(0, cbp, "Request failed (error=%d).", 11713aae74ecSPawel Jakub Dawidek cbp->bio_error); 11723aae74ecSPawel Jakub Dawidek } else { 11733aae74ecSPawel Jakub Dawidek G_RAID3_LOGREQ(1, cbp, "Request failed (error=%d).", 11743aae74ecSPawel Jakub Dawidek cbp->bio_error); 11753aae74ecSPawel Jakub Dawidek } 11763aae74ecSPawel Jakub Dawidek if (g_raid3_disconnect_on_failure && 11773aae74ecSPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE) { 11783aae74ecSPawel Jakub Dawidek sc->sc_bump_id |= G_RAID3_BUMP_GENID; 11793aae74ecSPawel Jakub Dawidek g_raid3_event_send(disk, 11803aae74ecSPawel Jakub Dawidek G_RAID3_DISK_STATE_DISCONNECTED, 11813aae74ecSPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 11823aae74ecSPawel Jakub Dawidek } 11832d1661a5SPawel Jakub Dawidek } 11842d1661a5SPawel Jakub Dawidek if (pbp->bio_error != 0) 11852d1661a5SPawel Jakub Dawidek goto finish; 1186dba915cfSPawel Jakub Dawidek if (fbp != NULL && (pbp->bio_pflags & G_RAID3_BIO_PFLAG_VERIFY) != 0) { 1187dba915cfSPawel 
Jakub Dawidek pbp->bio_pflags &= ~G_RAID3_BIO_PFLAG_VERIFY; 1188dba915cfSPawel Jakub Dawidek if (xbp != fbp) 1189dba915cfSPawel Jakub Dawidek g_raid3_replace_bio(xbp, fbp); 1190dba915cfSPawel Jakub Dawidek g_raid3_destroy_bio(sc, fbp); 1191dba915cfSPawel Jakub Dawidek } else if (fbp != NULL) { 11922d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 11932d1661a5SPawel Jakub Dawidek 11942d1661a5SPawel Jakub Dawidek /* 11952d1661a5SPawel Jakub Dawidek * One request failed, so send the same request to 11962d1661a5SPawel Jakub Dawidek * the parity consumer. 11972d1661a5SPawel Jakub Dawidek */ 1198f5a2f7feSPawel Jakub Dawidek disk = pbp->bio_driver2; 11992d1661a5SPawel Jakub Dawidek if (disk->d_state != G_RAID3_DISK_STATE_ACTIVE) { 1200f5a2f7feSPawel Jakub Dawidek pbp->bio_error = fbp->bio_error; 12012d1661a5SPawel Jakub Dawidek goto finish; 12022d1661a5SPawel Jakub Dawidek } 12032d1661a5SPawel Jakub Dawidek pbp->bio_pflags |= G_RAID3_BIO_PFLAG_DEGRADED; 12042d1661a5SPawel Jakub Dawidek pbp->bio_inbed--; 1205f5a2f7feSPawel Jakub Dawidek fbp->bio_flags &= ~(BIO_DONE | BIO_ERROR); 1206f5a2f7feSPawel Jakub Dawidek if (disk->d_no == sc->sc_ndisks - 1) 1207f5a2f7feSPawel Jakub Dawidek fbp->bio_cflags |= G_RAID3_BIO_CFLAG_PARITY; 1208f5a2f7feSPawel Jakub Dawidek fbp->bio_error = 0; 1209f5a2f7feSPawel Jakub Dawidek fbp->bio_completed = 0; 1210f5a2f7feSPawel Jakub Dawidek fbp->bio_children = 0; 1211f5a2f7feSPawel Jakub Dawidek fbp->bio_inbed = 0; 12122d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 1213f5a2f7feSPawel Jakub Dawidek fbp->bio_caller2 = disk; 1214f5a2f7feSPawel Jakub Dawidek fbp->bio_to = cp->provider; 1215f5a2f7feSPawel Jakub Dawidek G_RAID3_LOGREQ(3, fbp, "Sending request (recover)."); 12163650be51SPawel Jakub Dawidek KASSERT(cp->acr >= 1 && cp->acw >= 1 && cp->ace >= 1, 12172d1661a5SPawel Jakub Dawidek ("Consumer %s not opened (r%dw%de%d).", cp->provider->name, 12182d1661a5SPawel Jakub Dawidek cp->acr, cp->acw, cp->ace)); 121979e61493SPawel Jakub Dawidek 
cp->index++; 1220f5a2f7feSPawel Jakub Dawidek g_io_request(fbp, cp); 12212d1661a5SPawel Jakub Dawidek return; 12222d1661a5SPawel Jakub Dawidek } 1223f5a2f7feSPawel Jakub Dawidek if (xbp != NULL) { 1224f5a2f7feSPawel Jakub Dawidek /* 1225f5a2f7feSPawel Jakub Dawidek * Calculate parity. 1226f5a2f7feSPawel Jakub Dawidek */ 1227f5a2f7feSPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 1228f5a2f7feSPawel Jakub Dawidek if ((cbp->bio_cflags & G_RAID3_BIO_CFLAG_PARITY) != 0) 1229f5a2f7feSPawel Jakub Dawidek continue; 123006b215fdSAlexander Motin g_raid3_xor(cbp->bio_data, xbp->bio_data, 1231f5a2f7feSPawel Jakub Dawidek xbp->bio_length); 1232f5a2f7feSPawel Jakub Dawidek } 1233f5a2f7feSPawel Jakub Dawidek xbp->bio_cflags &= ~G_RAID3_BIO_CFLAG_PARITY; 1234dba915cfSPawel Jakub Dawidek if ((pbp->bio_pflags & G_RAID3_BIO_PFLAG_VERIFY) != 0) { 1235dba915cfSPawel Jakub Dawidek if (!g_raid3_is_zero(xbp)) { 1236dba915cfSPawel Jakub Dawidek g_raid3_parity_mismatch++; 1237dba915cfSPawel Jakub Dawidek pbp->bio_error = EIO; 1238dba915cfSPawel Jakub Dawidek goto finish; 1239dba915cfSPawel Jakub Dawidek } 1240dba915cfSPawel Jakub Dawidek g_raid3_destroy_bio(sc, xbp); 1241dba915cfSPawel Jakub Dawidek } 12422d1661a5SPawel Jakub Dawidek } 12432d1661a5SPawel Jakub Dawidek atom = sc->sc_sectorsize / (sc->sc_ndisks - 1); 12442d1661a5SPawel Jakub Dawidek cadd = padd = 0; 12452d1661a5SPawel Jakub Dawidek for (left = pbp->bio_length; left > 0; left -= sc->sc_sectorsize) { 12462d1661a5SPawel Jakub Dawidek G_RAID3_FOREACH_BIO(pbp, cbp) { 12472d1661a5SPawel Jakub Dawidek bcopy(cbp->bio_data + cadd, pbp->bio_data + padd, atom); 12482d1661a5SPawel Jakub Dawidek pbp->bio_completed += atom; 12492d1661a5SPawel Jakub Dawidek padd += atom; 12502d1661a5SPawel Jakub Dawidek } 12512d1661a5SPawel Jakub Dawidek cadd += atom; 12522d1661a5SPawel Jakub Dawidek } 12532d1661a5SPawel Jakub Dawidek finish: 12542d1661a5SPawel Jakub Dawidek if (pbp->bio_error == 0) 12552d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, 
pbp, "Request finished."); 12564cf67afeSPawel Jakub Dawidek else { 12574cf67afeSPawel Jakub Dawidek if ((pbp->bio_pflags & G_RAID3_BIO_PFLAG_VERIFY) != 0) 12584cf67afeSPawel Jakub Dawidek G_RAID3_LOGREQ(1, pbp, "Verification error."); 12592d1661a5SPawel Jakub Dawidek else 12602d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(0, pbp, "Request failed."); 12614cf67afeSPawel Jakub Dawidek } 1262dba915cfSPawel Jakub Dawidek pbp->bio_pflags &= ~G_RAID3_BIO_PFLAG_MASK; 12632d1661a5SPawel Jakub Dawidek while ((cbp = G_RAID3_HEAD_BIO(pbp)) != NULL) 12642d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 1265290c6161SPawel Jakub Dawidek g_io_deliver(pbp, pbp->bio_error); 12662d1661a5SPawel Jakub Dawidek } 12672d1661a5SPawel Jakub Dawidek 12682d1661a5SPawel Jakub Dawidek static void 12692d1661a5SPawel Jakub Dawidek g_raid3_done(struct bio *bp) 12702d1661a5SPawel Jakub Dawidek { 12712d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 12722d1661a5SPawel Jakub Dawidek 12732d1661a5SPawel Jakub Dawidek sc = bp->bio_from->geom->softc; 12742d1661a5SPawel Jakub Dawidek bp->bio_cflags |= G_RAID3_BIO_CFLAG_REGULAR; 12752d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Regular request done (error=%d).", bp->bio_error); 12762d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 12772d1661a5SPawel Jakub Dawidek bioq_insert_head(&sc->sc_queue, bp); 12788de58113SAlexander Motin mtx_unlock(&sc->sc_queue_mtx); 12792d1661a5SPawel Jakub Dawidek wakeup(sc); 12802d1661a5SPawel Jakub Dawidek wakeup(&sc->sc_queue); 12812d1661a5SPawel Jakub Dawidek } 12822d1661a5SPawel Jakub Dawidek 12832d1661a5SPawel Jakub Dawidek static void 12842d1661a5SPawel Jakub Dawidek g_raid3_regular_request(struct bio *cbp) 12852d1661a5SPawel Jakub Dawidek { 12862d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 12872d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 12882d1661a5SPawel Jakub Dawidek struct bio *pbp; 12892d1661a5SPawel Jakub Dawidek 12902d1661a5SPawel Jakub Dawidek g_topology_assert_not(); 
12912d1661a5SPawel Jakub Dawidek 12922d1661a5SPawel Jakub Dawidek pbp = cbp->bio_parent; 12932d1661a5SPawel Jakub Dawidek sc = pbp->bio_to->geom->softc; 12940962f942SPawel Jakub Dawidek cbp->bio_from->index--; 12950962f942SPawel Jakub Dawidek if (cbp->bio_cmd == BIO_WRITE) 12960962f942SPawel Jakub Dawidek sc->sc_writes--; 12972d1661a5SPawel Jakub Dawidek disk = cbp->bio_from->private; 12982d1661a5SPawel Jakub Dawidek if (disk == NULL) { 12992d1661a5SPawel Jakub Dawidek g_topology_lock(); 13002d1661a5SPawel Jakub Dawidek g_raid3_kill_consumer(sc, cbp->bio_from); 13012d1661a5SPawel Jakub Dawidek g_topology_unlock(); 13022d1661a5SPawel Jakub Dawidek } 13032d1661a5SPawel Jakub Dawidek 13042d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, cbp, "Request finished."); 13052d1661a5SPawel Jakub Dawidek pbp->bio_inbed++; 13062d1661a5SPawel Jakub Dawidek KASSERT(pbp->bio_inbed <= pbp->bio_children, 13072d1661a5SPawel Jakub Dawidek ("bio_inbed (%u) is bigger than bio_children (%u).", pbp->bio_inbed, 13082d1661a5SPawel Jakub Dawidek pbp->bio_children)); 13092d1661a5SPawel Jakub Dawidek if (pbp->bio_inbed != pbp->bio_children) 13102d1661a5SPawel Jakub Dawidek return; 13112d1661a5SPawel Jakub Dawidek switch (pbp->bio_cmd) { 13122d1661a5SPawel Jakub Dawidek case BIO_READ: 13132d1661a5SPawel Jakub Dawidek g_raid3_gather(pbp); 13142d1661a5SPawel Jakub Dawidek break; 13152d1661a5SPawel Jakub Dawidek case BIO_WRITE: 13162d1661a5SPawel Jakub Dawidek case BIO_DELETE: 13172d1661a5SPawel Jakub Dawidek { 13182d1661a5SPawel Jakub Dawidek int error = 0; 13192d1661a5SPawel Jakub Dawidek 13202d1661a5SPawel Jakub Dawidek pbp->bio_completed = pbp->bio_length; 13212d1661a5SPawel Jakub Dawidek while ((cbp = G_RAID3_HEAD_BIO(pbp)) != NULL) { 13223aae74ecSPawel Jakub Dawidek if (cbp->bio_error == 0) { 13233aae74ecSPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 13243aae74ecSPawel Jakub Dawidek continue; 13252d1661a5SPawel Jakub Dawidek } 13263aae74ecSPawel Jakub Dawidek 13272d1661a5SPawel Jakub 
Dawidek if (error == 0) 13282d1661a5SPawel Jakub Dawidek error = cbp->bio_error; 13292d1661a5SPawel Jakub Dawidek else if (pbp->bio_error == 0) { 13302d1661a5SPawel Jakub Dawidek /* 13312d1661a5SPawel Jakub Dawidek * Next failed request, that's too many. 13322d1661a5SPawel Jakub Dawidek */ 13332d1661a5SPawel Jakub Dawidek pbp->bio_error = error; 13342d1661a5SPawel Jakub Dawidek } 13353aae74ecSPawel Jakub Dawidek 13363aae74ecSPawel Jakub Dawidek disk = cbp->bio_caller2; 13373aae74ecSPawel Jakub Dawidek if (disk == NULL) { 13383aae74ecSPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 13393aae74ecSPawel Jakub Dawidek continue; 13403aae74ecSPawel Jakub Dawidek } 13413aae74ecSPawel Jakub Dawidek 13423aae74ecSPawel Jakub Dawidek if ((disk->d_flags & G_RAID3_DISK_FLAG_BROKEN) == 0) { 13433aae74ecSPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_BROKEN; 13443aae74ecSPawel Jakub Dawidek G_RAID3_LOGREQ(0, cbp, 13453aae74ecSPawel Jakub Dawidek "Request failed (error=%d).", 13463aae74ecSPawel Jakub Dawidek cbp->bio_error); 13473aae74ecSPawel Jakub Dawidek } else { 13483aae74ecSPawel Jakub Dawidek G_RAID3_LOGREQ(1, cbp, 13493aae74ecSPawel Jakub Dawidek "Request failed (error=%d).", 13503aae74ecSPawel Jakub Dawidek cbp->bio_error); 13513aae74ecSPawel Jakub Dawidek } 13523aae74ecSPawel Jakub Dawidek if (g_raid3_disconnect_on_failure && 13533aae74ecSPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE) { 13543aae74ecSPawel Jakub Dawidek sc->sc_bump_id |= G_RAID3_BUMP_GENID; 13553aae74ecSPawel Jakub Dawidek g_raid3_event_send(disk, 13563aae74ecSPawel Jakub Dawidek G_RAID3_DISK_STATE_DISCONNECTED, 13573aae74ecSPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 13582d1661a5SPawel Jakub Dawidek } 13592d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 13602d1661a5SPawel Jakub Dawidek } 13612d1661a5SPawel Jakub Dawidek if (pbp->bio_error == 0) 13622d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, pbp, "Request finished."); 13632d1661a5SPawel Jakub Dawidek else 
13642d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(0, pbp, "Request failed."); 13652d1661a5SPawel Jakub Dawidek pbp->bio_pflags &= ~G_RAID3_BIO_PFLAG_DEGRADED; 13662d1661a5SPawel Jakub Dawidek pbp->bio_pflags &= ~G_RAID3_BIO_PFLAG_NOPARITY; 13673650be51SPawel Jakub Dawidek bioq_remove(&sc->sc_inflight, pbp); 13683650be51SPawel Jakub Dawidek /* Release delayed sync requests if possible. */ 13693650be51SPawel Jakub Dawidek g_raid3_sync_release(sc); 13702d1661a5SPawel Jakub Dawidek g_io_deliver(pbp, pbp->bio_error); 13712d1661a5SPawel Jakub Dawidek break; 13722d1661a5SPawel Jakub Dawidek } 13732d1661a5SPawel Jakub Dawidek } 13742d1661a5SPawel Jakub Dawidek } 13752d1661a5SPawel Jakub Dawidek 13762d1661a5SPawel Jakub Dawidek static void 13772d1661a5SPawel Jakub Dawidek g_raid3_sync_done(struct bio *bp) 13782d1661a5SPawel Jakub Dawidek { 13792d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 13802d1661a5SPawel Jakub Dawidek 13812d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Synchronization request delivered."); 13822d1661a5SPawel Jakub Dawidek sc = bp->bio_from->geom->softc; 13832d1661a5SPawel Jakub Dawidek bp->bio_cflags |= G_RAID3_BIO_CFLAG_SYNC; 13842d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 13852d1661a5SPawel Jakub Dawidek bioq_insert_head(&sc->sc_queue, bp); 13868de58113SAlexander Motin mtx_unlock(&sc->sc_queue_mtx); 13872d1661a5SPawel Jakub Dawidek wakeup(sc); 13882d1661a5SPawel Jakub Dawidek wakeup(&sc->sc_queue); 13892d1661a5SPawel Jakub Dawidek } 13902d1661a5SPawel Jakub Dawidek 13912d1661a5SPawel Jakub Dawidek static void 139242461fbaSPawel Jakub Dawidek g_raid3_flush(struct g_raid3_softc *sc, struct bio *bp) 139342461fbaSPawel Jakub Dawidek { 139442461fbaSPawel Jakub Dawidek struct bio_queue_head queue; 139542461fbaSPawel Jakub Dawidek struct g_raid3_disk *disk; 139642461fbaSPawel Jakub Dawidek struct g_consumer *cp; 139742461fbaSPawel Jakub Dawidek struct bio *cbp; 139842461fbaSPawel Jakub Dawidek u_int i; 139942461fbaSPawel Jakub Dawidek 
140042461fbaSPawel Jakub Dawidek bioq_init(&queue); 140142461fbaSPawel Jakub Dawidek for (i = 0; i < sc->sc_ndisks; i++) { 140242461fbaSPawel Jakub Dawidek disk = &sc->sc_disks[i]; 140342461fbaSPawel Jakub Dawidek if (disk->d_state != G_RAID3_DISK_STATE_ACTIVE) 140442461fbaSPawel Jakub Dawidek continue; 140542461fbaSPawel Jakub Dawidek cbp = g_clone_bio(bp); 140642461fbaSPawel Jakub Dawidek if (cbp == NULL) { 140742461fbaSPawel Jakub Dawidek for (cbp = bioq_first(&queue); cbp != NULL; 140842461fbaSPawel Jakub Dawidek cbp = bioq_first(&queue)) { 140942461fbaSPawel Jakub Dawidek bioq_remove(&queue, cbp); 141042461fbaSPawel Jakub Dawidek g_destroy_bio(cbp); 141142461fbaSPawel Jakub Dawidek } 141242461fbaSPawel Jakub Dawidek if (bp->bio_error == 0) 141342461fbaSPawel Jakub Dawidek bp->bio_error = ENOMEM; 141442461fbaSPawel Jakub Dawidek g_io_deliver(bp, bp->bio_error); 141542461fbaSPawel Jakub Dawidek return; 141642461fbaSPawel Jakub Dawidek } 141742461fbaSPawel Jakub Dawidek bioq_insert_tail(&queue, cbp); 141842461fbaSPawel Jakub Dawidek cbp->bio_done = g_std_done; 141942461fbaSPawel Jakub Dawidek cbp->bio_caller1 = disk; 142042461fbaSPawel Jakub Dawidek cbp->bio_to = disk->d_consumer->provider; 142142461fbaSPawel Jakub Dawidek } 142242461fbaSPawel Jakub Dawidek for (cbp = bioq_first(&queue); cbp != NULL; cbp = bioq_first(&queue)) { 142342461fbaSPawel Jakub Dawidek bioq_remove(&queue, cbp); 142442461fbaSPawel Jakub Dawidek G_RAID3_LOGREQ(3, cbp, "Sending request."); 142542461fbaSPawel Jakub Dawidek disk = cbp->bio_caller1; 142642461fbaSPawel Jakub Dawidek cbp->bio_caller1 = NULL; 142742461fbaSPawel Jakub Dawidek cp = disk->d_consumer; 142842461fbaSPawel Jakub Dawidek KASSERT(cp->acr >= 1 && cp->acw >= 1 && cp->ace >= 1, 142942461fbaSPawel Jakub Dawidek ("Consumer %s not opened (r%dw%de%d).", cp->provider->name, 143042461fbaSPawel Jakub Dawidek cp->acr, cp->acw, cp->ace)); 143142461fbaSPawel Jakub Dawidek g_io_request(cbp, disk->d_consumer); 143242461fbaSPawel Jakub 
Dawidek } 143342461fbaSPawel Jakub Dawidek } 143442461fbaSPawel Jakub Dawidek 143542461fbaSPawel Jakub Dawidek static void 14362d1661a5SPawel Jakub Dawidek g_raid3_start(struct bio *bp) 14372d1661a5SPawel Jakub Dawidek { 14382d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 14392d1661a5SPawel Jakub Dawidek 14402d1661a5SPawel Jakub Dawidek sc = bp->bio_to->geom->softc; 14412d1661a5SPawel Jakub Dawidek /* 14422d1661a5SPawel Jakub Dawidek * If sc == NULL or there are no valid disks, provider's error 14432d1661a5SPawel Jakub Dawidek * should be set and g_raid3_start() should not be called at all. 14442d1661a5SPawel Jakub Dawidek */ 14452d1661a5SPawel Jakub Dawidek KASSERT(sc != NULL && (sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 14462d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE), 14472d1661a5SPawel Jakub Dawidek ("Provider's error should be set (error=%d)(device=%s).", 14482d1661a5SPawel Jakub Dawidek bp->bio_to->error, bp->bio_to->name)); 14492d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Request received."); 14502d1661a5SPawel Jakub Dawidek 14512d1661a5SPawel Jakub Dawidek switch (bp->bio_cmd) { 14522d1661a5SPawel Jakub Dawidek case BIO_READ: 14532d1661a5SPawel Jakub Dawidek case BIO_WRITE: 14542d1661a5SPawel Jakub Dawidek case BIO_DELETE: 14552d1661a5SPawel Jakub Dawidek break; 145642461fbaSPawel Jakub Dawidek case BIO_FLUSH: 145742461fbaSPawel Jakub Dawidek g_raid3_flush(sc, bp); 145842461fbaSPawel Jakub Dawidek return; 14592d1661a5SPawel Jakub Dawidek case BIO_GETATTR: 14602d1661a5SPawel Jakub Dawidek default: 14612d1661a5SPawel Jakub Dawidek g_io_deliver(bp, EOPNOTSUPP); 14622d1661a5SPawel Jakub Dawidek return; 14632d1661a5SPawel Jakub Dawidek } 14642d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 14652d1661a5SPawel Jakub Dawidek bioq_insert_tail(&sc->sc_queue, bp); 14668de58113SAlexander Motin mtx_unlock(&sc->sc_queue_mtx); 14672d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, sc); 
14682d1661a5SPawel Jakub Dawidek wakeup(sc); 14692d1661a5SPawel Jakub Dawidek } 14702d1661a5SPawel Jakub Dawidek 14712d1661a5SPawel Jakub Dawidek /* 14723650be51SPawel Jakub Dawidek * Return TRUE if the given request is colliding with a in-progress 14733650be51SPawel Jakub Dawidek * synchronization request. 14742d1661a5SPawel Jakub Dawidek */ 14753650be51SPawel Jakub Dawidek static int 14763650be51SPawel Jakub Dawidek g_raid3_sync_collision(struct g_raid3_softc *sc, struct bio *bp) 14772d1661a5SPawel Jakub Dawidek { 14782d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 14793650be51SPawel Jakub Dawidek struct bio *sbp; 14803650be51SPawel Jakub Dawidek off_t rstart, rend, sstart, send; 14813650be51SPawel Jakub Dawidek int i; 14823650be51SPawel Jakub Dawidek 14833650be51SPawel Jakub Dawidek disk = sc->sc_syncdisk; 14843650be51SPawel Jakub Dawidek if (disk == NULL) 14853650be51SPawel Jakub Dawidek return (0); 14863650be51SPawel Jakub Dawidek rstart = bp->bio_offset; 14873650be51SPawel Jakub Dawidek rend = bp->bio_offset + bp->bio_length; 14883650be51SPawel Jakub Dawidek for (i = 0; i < g_raid3_syncreqs; i++) { 14893650be51SPawel Jakub Dawidek sbp = disk->d_sync.ds_bios[i]; 14903650be51SPawel Jakub Dawidek if (sbp == NULL) 14913650be51SPawel Jakub Dawidek continue; 14923650be51SPawel Jakub Dawidek sstart = sbp->bio_offset; 14933650be51SPawel Jakub Dawidek send = sbp->bio_length; 14943650be51SPawel Jakub Dawidek if (sbp->bio_cmd == BIO_WRITE) { 14953650be51SPawel Jakub Dawidek sstart *= sc->sc_ndisks - 1; 14963650be51SPawel Jakub Dawidek send *= sc->sc_ndisks - 1; 14973650be51SPawel Jakub Dawidek } 14983650be51SPawel Jakub Dawidek send += sstart; 14993650be51SPawel Jakub Dawidek if (rend > sstart && rstart < send) 15003650be51SPawel Jakub Dawidek return (1); 15013650be51SPawel Jakub Dawidek } 15023650be51SPawel Jakub Dawidek return (0); 15033650be51SPawel Jakub Dawidek } 15043650be51SPawel Jakub Dawidek 15053650be51SPawel Jakub Dawidek /* 15063650be51SPawel Jakub 
Dawidek * Return TRUE if the given sync request is colliding with a in-progress regular 15073650be51SPawel Jakub Dawidek * request. 15083650be51SPawel Jakub Dawidek */ 15093650be51SPawel Jakub Dawidek static int 15103650be51SPawel Jakub Dawidek g_raid3_regular_collision(struct g_raid3_softc *sc, struct bio *sbp) 15113650be51SPawel Jakub Dawidek { 15123650be51SPawel Jakub Dawidek off_t rstart, rend, sstart, send; 15132d1661a5SPawel Jakub Dawidek struct bio *bp; 15142d1661a5SPawel Jakub Dawidek 15153650be51SPawel Jakub Dawidek if (sc->sc_syncdisk == NULL) 15163650be51SPawel Jakub Dawidek return (0); 15173650be51SPawel Jakub Dawidek sstart = sbp->bio_offset; 15183650be51SPawel Jakub Dawidek send = sstart + sbp->bio_length; 15193650be51SPawel Jakub Dawidek TAILQ_FOREACH(bp, &sc->sc_inflight.queue, bio_queue) { 15203650be51SPawel Jakub Dawidek rstart = bp->bio_offset; 15213650be51SPawel Jakub Dawidek rend = bp->bio_offset + bp->bio_length; 15223650be51SPawel Jakub Dawidek if (rend > sstart && rstart < send) 15233650be51SPawel Jakub Dawidek return (1); 15242d1661a5SPawel Jakub Dawidek } 15253650be51SPawel Jakub Dawidek return (0); 15262d1661a5SPawel Jakub Dawidek } 15272d1661a5SPawel Jakub Dawidek 15283650be51SPawel Jakub Dawidek /* 15293650be51SPawel Jakub Dawidek * Puts request onto delayed queue. 15303650be51SPawel Jakub Dawidek */ 15313650be51SPawel Jakub Dawidek static void 15323650be51SPawel Jakub Dawidek g_raid3_regular_delay(struct g_raid3_softc *sc, struct bio *bp) 15333650be51SPawel Jakub Dawidek { 15343650be51SPawel Jakub Dawidek 15353650be51SPawel Jakub Dawidek G_RAID3_LOGREQ(2, bp, "Delaying request."); 15363650be51SPawel Jakub Dawidek bioq_insert_head(&sc->sc_regular_delayed, bp); 15373650be51SPawel Jakub Dawidek } 15383650be51SPawel Jakub Dawidek 15393650be51SPawel Jakub Dawidek /* 15403650be51SPawel Jakub Dawidek * Puts synchronization request onto delayed queue. 
15413650be51SPawel Jakub Dawidek */ 15423650be51SPawel Jakub Dawidek static void 15433650be51SPawel Jakub Dawidek g_raid3_sync_delay(struct g_raid3_softc *sc, struct bio *bp) 15443650be51SPawel Jakub Dawidek { 15453650be51SPawel Jakub Dawidek 15463650be51SPawel Jakub Dawidek G_RAID3_LOGREQ(2, bp, "Delaying synchronization request."); 15473650be51SPawel Jakub Dawidek bioq_insert_tail(&sc->sc_sync_delayed, bp); 15483650be51SPawel Jakub Dawidek } 15493650be51SPawel Jakub Dawidek 15503650be51SPawel Jakub Dawidek /* 15513650be51SPawel Jakub Dawidek * Releases delayed regular requests which don't collide anymore with sync 15523650be51SPawel Jakub Dawidek * requests. 15533650be51SPawel Jakub Dawidek */ 15543650be51SPawel Jakub Dawidek static void 15553650be51SPawel Jakub Dawidek g_raid3_regular_release(struct g_raid3_softc *sc) 15563650be51SPawel Jakub Dawidek { 15573650be51SPawel Jakub Dawidek struct bio *bp, *bp2; 15583650be51SPawel Jakub Dawidek 15593650be51SPawel Jakub Dawidek TAILQ_FOREACH_SAFE(bp, &sc->sc_regular_delayed.queue, bio_queue, bp2) { 15603650be51SPawel Jakub Dawidek if (g_raid3_sync_collision(sc, bp)) 15613650be51SPawel Jakub Dawidek continue; 15623650be51SPawel Jakub Dawidek bioq_remove(&sc->sc_regular_delayed, bp); 15633650be51SPawel Jakub Dawidek G_RAID3_LOGREQ(2, bp, "Releasing delayed request (%p).", bp); 15643650be51SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 15653650be51SPawel Jakub Dawidek bioq_insert_head(&sc->sc_queue, bp); 15663650be51SPawel Jakub Dawidek #if 0 15673650be51SPawel Jakub Dawidek /* 15683650be51SPawel Jakub Dawidek * wakeup() is not needed, because this function is called from 15693650be51SPawel Jakub Dawidek * the worker thread. 
15703650be51SPawel Jakub Dawidek */ 15713650be51SPawel Jakub Dawidek wakeup(&sc->sc_queue); 15723650be51SPawel Jakub Dawidek #endif 15733650be51SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 15743650be51SPawel Jakub Dawidek } 15753650be51SPawel Jakub Dawidek } 15763650be51SPawel Jakub Dawidek 15773650be51SPawel Jakub Dawidek /* 15783650be51SPawel Jakub Dawidek * Releases delayed sync requests which don't collide anymore with regular 15793650be51SPawel Jakub Dawidek * requests. 15803650be51SPawel Jakub Dawidek */ 15813650be51SPawel Jakub Dawidek static void 15823650be51SPawel Jakub Dawidek g_raid3_sync_release(struct g_raid3_softc *sc) 15833650be51SPawel Jakub Dawidek { 15843650be51SPawel Jakub Dawidek struct bio *bp, *bp2; 15853650be51SPawel Jakub Dawidek 15863650be51SPawel Jakub Dawidek TAILQ_FOREACH_SAFE(bp, &sc->sc_sync_delayed.queue, bio_queue, bp2) { 15873650be51SPawel Jakub Dawidek if (g_raid3_regular_collision(sc, bp)) 15883650be51SPawel Jakub Dawidek continue; 15893650be51SPawel Jakub Dawidek bioq_remove(&sc->sc_sync_delayed, bp); 15903650be51SPawel Jakub Dawidek G_RAID3_LOGREQ(2, bp, 15913650be51SPawel Jakub Dawidek "Releasing delayed synchronization request."); 15923650be51SPawel Jakub Dawidek g_io_request(bp, bp->bio_from); 15933650be51SPawel Jakub Dawidek } 15943650be51SPawel Jakub Dawidek } 15953650be51SPawel Jakub Dawidek 15963650be51SPawel Jakub Dawidek /* 15973650be51SPawel Jakub Dawidek * Handle synchronization requests. 15983650be51SPawel Jakub Dawidek * Every synchronization request is two-steps process: first, READ request is 15993650be51SPawel Jakub Dawidek * send to active provider and then WRITE request (with read data) to the provider 16003650be51SPawel Jakub Dawidek * beeing synchronized. When WRITE is finished, new synchronization request is 16013650be51SPawel Jakub Dawidek * send. 
16023650be51SPawel Jakub Dawidek */ 16032d1661a5SPawel Jakub Dawidek static void 16042d1661a5SPawel Jakub Dawidek g_raid3_sync_request(struct bio *bp) 16052d1661a5SPawel Jakub Dawidek { 16062d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 16072d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 16082d1661a5SPawel Jakub Dawidek 160979e61493SPawel Jakub Dawidek bp->bio_from->index--; 16102d1661a5SPawel Jakub Dawidek sc = bp->bio_from->geom->softc; 16112d1661a5SPawel Jakub Dawidek disk = bp->bio_from->private; 16122d1661a5SPawel Jakub Dawidek if (disk == NULL) { 16133650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); /* Avoid recursion on sc_lock. */ 16142d1661a5SPawel Jakub Dawidek g_topology_lock(); 16152d1661a5SPawel Jakub Dawidek g_raid3_kill_consumer(sc, bp->bio_from); 16162d1661a5SPawel Jakub Dawidek g_topology_unlock(); 16173650be51SPawel Jakub Dawidek free(bp->bio_data, M_RAID3); 16182d1661a5SPawel Jakub Dawidek g_destroy_bio(bp); 16193650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 16202d1661a5SPawel Jakub Dawidek return; 16212d1661a5SPawel Jakub Dawidek } 16222d1661a5SPawel Jakub Dawidek 16232d1661a5SPawel Jakub Dawidek /* 16242d1661a5SPawel Jakub Dawidek * Synchronization request. 
16252d1661a5SPawel Jakub Dawidek */ 16262d1661a5SPawel Jakub Dawidek switch (bp->bio_cmd) { 16272d1661a5SPawel Jakub Dawidek case BIO_READ: 16282d1661a5SPawel Jakub Dawidek { 16292d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 16302d1661a5SPawel Jakub Dawidek u_char *dst, *src; 16312d1661a5SPawel Jakub Dawidek off_t left; 16322d1661a5SPawel Jakub Dawidek u_int atom; 16332d1661a5SPawel Jakub Dawidek 16342d1661a5SPawel Jakub Dawidek if (bp->bio_error != 0) { 16352d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(0, bp, 16362d1661a5SPawel Jakub Dawidek "Synchronization request failed (error=%d).", 16372d1661a5SPawel Jakub Dawidek bp->bio_error); 16382d1661a5SPawel Jakub Dawidek g_destroy_bio(bp); 16392d1661a5SPawel Jakub Dawidek return; 16402d1661a5SPawel Jakub Dawidek } 16412d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Synchronization request finished."); 16422d1661a5SPawel Jakub Dawidek atom = sc->sc_sectorsize / (sc->sc_ndisks - 1); 16432d1661a5SPawel Jakub Dawidek dst = src = bp->bio_data; 16442d1661a5SPawel Jakub Dawidek if (disk->d_no == sc->sc_ndisks - 1) { 16452d1661a5SPawel Jakub Dawidek u_int n; 16462d1661a5SPawel Jakub Dawidek 16472d1661a5SPawel Jakub Dawidek /* Parity component. */ 16482d1661a5SPawel Jakub Dawidek for (left = bp->bio_length; left > 0; 16492d1661a5SPawel Jakub Dawidek left -= sc->sc_sectorsize) { 16502d1661a5SPawel Jakub Dawidek bcopy(src, dst, atom); 16512d1661a5SPawel Jakub Dawidek src += atom; 16522d1661a5SPawel Jakub Dawidek for (n = 1; n < sc->sc_ndisks - 1; n++) { 165306b215fdSAlexander Motin g_raid3_xor(src, dst, atom); 16542d1661a5SPawel Jakub Dawidek src += atom; 16552d1661a5SPawel Jakub Dawidek } 16562d1661a5SPawel Jakub Dawidek dst += atom; 16572d1661a5SPawel Jakub Dawidek } 16582d1661a5SPawel Jakub Dawidek } else { 16592d1661a5SPawel Jakub Dawidek /* Regular component. 
*/ 16602d1661a5SPawel Jakub Dawidek src += atom * disk->d_no; 16612d1661a5SPawel Jakub Dawidek for (left = bp->bio_length; left > 0; 16622d1661a5SPawel Jakub Dawidek left -= sc->sc_sectorsize) { 16632d1661a5SPawel Jakub Dawidek bcopy(src, dst, atom); 16642d1661a5SPawel Jakub Dawidek src += sc->sc_sectorsize; 16652d1661a5SPawel Jakub Dawidek dst += atom; 16662d1661a5SPawel Jakub Dawidek } 16672d1661a5SPawel Jakub Dawidek } 16683650be51SPawel Jakub Dawidek bp->bio_driver1 = bp->bio_driver2 = NULL; 16693650be51SPawel Jakub Dawidek bp->bio_pflags = 0; 16702d1661a5SPawel Jakub Dawidek bp->bio_offset /= sc->sc_ndisks - 1; 16712d1661a5SPawel Jakub Dawidek bp->bio_length /= sc->sc_ndisks - 1; 16722d1661a5SPawel Jakub Dawidek bp->bio_cmd = BIO_WRITE; 16732d1661a5SPawel Jakub Dawidek bp->bio_cflags = 0; 16742d1661a5SPawel Jakub Dawidek bp->bio_children = bp->bio_inbed = 0; 16752d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 16763650be51SPawel Jakub Dawidek KASSERT(cp->acr >= 1 && cp->acw >= 1 && cp->ace >= 1, 16772d1661a5SPawel Jakub Dawidek ("Consumer %s not opened (r%dw%de%d).", cp->provider->name, 16782d1661a5SPawel Jakub Dawidek cp->acr, cp->acw, cp->ace)); 167979e61493SPawel Jakub Dawidek cp->index++; 16802d1661a5SPawel Jakub Dawidek g_io_request(bp, cp); 16812d1661a5SPawel Jakub Dawidek return; 16822d1661a5SPawel Jakub Dawidek } 16832d1661a5SPawel Jakub Dawidek case BIO_WRITE: 1684d2fb9c62SPawel Jakub Dawidek { 1685d2fb9c62SPawel Jakub Dawidek struct g_raid3_disk_sync *sync; 16863650be51SPawel Jakub Dawidek off_t boffset, moffset; 16873650be51SPawel Jakub Dawidek void *data; 16883650be51SPawel Jakub Dawidek int i; 1689d2fb9c62SPawel Jakub Dawidek 16902d1661a5SPawel Jakub Dawidek if (bp->bio_error != 0) { 16912d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(0, bp, 16922d1661a5SPawel Jakub Dawidek "Synchronization request failed (error=%d).", 16932d1661a5SPawel Jakub Dawidek bp->bio_error); 16942d1661a5SPawel Jakub Dawidek g_destroy_bio(bp); 1695ea973705SPawel Jakub 
Dawidek sc->sc_bump_id |= G_RAID3_BUMP_GENID; 16962d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, 16972d1661a5SPawel Jakub Dawidek G_RAID3_DISK_STATE_DISCONNECTED, 16982d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 16992d1661a5SPawel Jakub Dawidek return; 17002d1661a5SPawel Jakub Dawidek } 17012d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Synchronization request finished."); 1702d2fb9c62SPawel Jakub Dawidek sync = &disk->d_sync; 17033650be51SPawel Jakub Dawidek if (sync->ds_offset == sc->sc_mediasize / (sc->sc_ndisks - 1) || 17043650be51SPawel Jakub Dawidek sync->ds_consumer == NULL || 17053650be51SPawel Jakub Dawidek (sc->sc_flags & G_RAID3_DEVICE_FLAG_DESTROY) != 0) { 17063650be51SPawel Jakub Dawidek /* Don't send more synchronization requests. */ 17073650be51SPawel Jakub Dawidek sync->ds_inflight--; 17083650be51SPawel Jakub Dawidek if (sync->ds_bios != NULL) { 1709ef25813dSRuslan Ermilov i = (int)(uintptr_t)bp->bio_caller1; 17103650be51SPawel Jakub Dawidek sync->ds_bios[i] = NULL; 17113650be51SPawel Jakub Dawidek } 17123650be51SPawel Jakub Dawidek free(bp->bio_data, M_RAID3); 17132d1661a5SPawel Jakub Dawidek g_destroy_bio(bp); 17143650be51SPawel Jakub Dawidek if (sync->ds_inflight > 0) 1715d2fb9c62SPawel Jakub Dawidek return; 17163650be51SPawel Jakub Dawidek if (sync->ds_consumer == NULL || 17173650be51SPawel Jakub Dawidek (sc->sc_flags & G_RAID3_DEVICE_FLAG_DESTROY) != 0) { 17183650be51SPawel Jakub Dawidek return; 17193650be51SPawel Jakub Dawidek } 17202d1661a5SPawel Jakub Dawidek /* 17212d1661a5SPawel Jakub Dawidek * Disk up-to-date, activate it. 17222d1661a5SPawel Jakub Dawidek */ 17232d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, G_RAID3_DISK_STATE_ACTIVE, 17242d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT); 17252d1661a5SPawel Jakub Dawidek return; 17263650be51SPawel Jakub Dawidek } 17273650be51SPawel Jakub Dawidek 17283650be51SPawel Jakub Dawidek /* Send next synchronization request. 
*/ 17293650be51SPawel Jakub Dawidek data = bp->bio_data; 17303650be51SPawel Jakub Dawidek bzero(bp, sizeof(*bp)); 17313650be51SPawel Jakub Dawidek bp->bio_cmd = BIO_READ; 17323650be51SPawel Jakub Dawidek bp->bio_offset = sync->ds_offset * (sc->sc_ndisks - 1); 17333650be51SPawel Jakub Dawidek bp->bio_length = MIN(MAXPHYS, sc->sc_mediasize - bp->bio_offset); 17343650be51SPawel Jakub Dawidek sync->ds_offset += bp->bio_length / (sc->sc_ndisks - 1); 17353650be51SPawel Jakub Dawidek bp->bio_done = g_raid3_sync_done; 17363650be51SPawel Jakub Dawidek bp->bio_data = data; 17373650be51SPawel Jakub Dawidek bp->bio_from = sync->ds_consumer; 17383650be51SPawel Jakub Dawidek bp->bio_to = sc->sc_provider; 17393650be51SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Sending synchronization request."); 17403650be51SPawel Jakub Dawidek sync->ds_consumer->index++; 17412d1661a5SPawel Jakub Dawidek /* 17423650be51SPawel Jakub Dawidek * Delay the request if it is colliding with a regular request. 17432d1661a5SPawel Jakub Dawidek */ 17443650be51SPawel Jakub Dawidek if (g_raid3_regular_collision(sc, bp)) 17453650be51SPawel Jakub Dawidek g_raid3_sync_delay(sc, bp); 17463650be51SPawel Jakub Dawidek else 17473650be51SPawel Jakub Dawidek g_io_request(bp, sync->ds_consumer); 17483650be51SPawel Jakub Dawidek 17493650be51SPawel Jakub Dawidek /* Release delayed requests if possible. */ 17503650be51SPawel Jakub Dawidek g_raid3_regular_release(sc); 17513650be51SPawel Jakub Dawidek 17523650be51SPawel Jakub Dawidek /* Find the smallest offset. 
*/ 17533650be51SPawel Jakub Dawidek moffset = sc->sc_mediasize; 17543650be51SPawel Jakub Dawidek for (i = 0; i < g_raid3_syncreqs; i++) { 17553650be51SPawel Jakub Dawidek bp = sync->ds_bios[i]; 17563650be51SPawel Jakub Dawidek boffset = bp->bio_offset; 17573650be51SPawel Jakub Dawidek if (bp->bio_cmd == BIO_WRITE) 17583650be51SPawel Jakub Dawidek boffset *= sc->sc_ndisks - 1; 17593650be51SPawel Jakub Dawidek if (boffset < moffset) 17603650be51SPawel Jakub Dawidek moffset = boffset; 17613650be51SPawel Jakub Dawidek } 17623650be51SPawel Jakub Dawidek if (sync->ds_offset_done + (MAXPHYS * 100) < moffset) { 17633650be51SPawel Jakub Dawidek /* Update offset_done on every 100 blocks. */ 17643650be51SPawel Jakub Dawidek sync->ds_offset_done = moffset; 17652d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(disk); 17662d1661a5SPawel Jakub Dawidek } 17672d1661a5SPawel Jakub Dawidek return; 1768d2fb9c62SPawel Jakub Dawidek } 17692d1661a5SPawel Jakub Dawidek default: 17702d1661a5SPawel Jakub Dawidek KASSERT(1 == 0, ("Invalid command here: %u (device=%s)", 17712d1661a5SPawel Jakub Dawidek bp->bio_cmd, sc->sc_name)); 17722d1661a5SPawel Jakub Dawidek break; 17732d1661a5SPawel Jakub Dawidek } 17742d1661a5SPawel Jakub Dawidek } 17752d1661a5SPawel Jakub Dawidek 17762d1661a5SPawel Jakub Dawidek static int 17772d1661a5SPawel Jakub Dawidek g_raid3_register_request(struct bio *pbp) 17782d1661a5SPawel Jakub Dawidek { 17792d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 17802d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 17812d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 1782ee40c7aaSPawel Jakub Dawidek struct bio *cbp, *tmpbp; 17832d1661a5SPawel Jakub Dawidek off_t offset, length; 1784fa6a7837SDavid E. O'Brien u_int n, ndisks; 1785dba915cfSPawel Jakub Dawidek int round_robin, verify; 17862d1661a5SPawel Jakub Dawidek 1787fa6a7837SDavid E. 
O'Brien ndisks = 0; 17882d1661a5SPawel Jakub Dawidek sc = pbp->bio_to->geom->softc; 17892d1661a5SPawel Jakub Dawidek if ((pbp->bio_cflags & G_RAID3_BIO_CFLAG_REGSYNC) != 0 && 17902d1661a5SPawel Jakub Dawidek sc->sc_syncdisk == NULL) { 17912d1661a5SPawel Jakub Dawidek g_io_deliver(pbp, EIO); 17922d1661a5SPawel Jakub Dawidek return (0); 17932d1661a5SPawel Jakub Dawidek } 17942d1661a5SPawel Jakub Dawidek g_raid3_init_bio(pbp); 17952d1661a5SPawel Jakub Dawidek length = pbp->bio_length / (sc->sc_ndisks - 1); 17962d1661a5SPawel Jakub Dawidek offset = pbp->bio_offset / (sc->sc_ndisks - 1); 1797dba915cfSPawel Jakub Dawidek round_robin = verify = 0; 17982d1661a5SPawel Jakub Dawidek switch (pbp->bio_cmd) { 17992d1661a5SPawel Jakub Dawidek case BIO_READ: 1800dba915cfSPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_VERIFY) != 0 && 1801dba915cfSPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE) { 1802dba915cfSPawel Jakub Dawidek pbp->bio_pflags |= G_RAID3_BIO_PFLAG_VERIFY; 1803dba915cfSPawel Jakub Dawidek verify = 1; 1804dba915cfSPawel Jakub Dawidek ndisks = sc->sc_ndisks; 1805dba915cfSPawel Jakub Dawidek } else { 1806dba915cfSPawel Jakub Dawidek verify = 0; 18072d1661a5SPawel Jakub Dawidek ndisks = sc->sc_ndisks - 1; 1808dba915cfSPawel Jakub Dawidek } 1809dba915cfSPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_ROUND_ROBIN) != 0 && 1810dba915cfSPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE) { 1811dba915cfSPawel Jakub Dawidek round_robin = 1; 1812dba915cfSPawel Jakub Dawidek } else { 1813dba915cfSPawel Jakub Dawidek round_robin = 0; 1814dba915cfSPawel Jakub Dawidek } 1815dba915cfSPawel Jakub Dawidek KASSERT(!round_robin || !verify, 1816dba915cfSPawel Jakub Dawidek ("ROUND-ROBIN and VERIFY are mutually exclusive.")); 1817f5a2f7feSPawel Jakub Dawidek pbp->bio_driver2 = &sc->sc_disks[sc->sc_ndisks - 1]; 18182d1661a5SPawel Jakub Dawidek break; 18192d1661a5SPawel Jakub Dawidek case BIO_WRITE: 18202d1661a5SPawel Jakub 
Dawidek case BIO_DELETE: 18213650be51SPawel Jakub Dawidek /* 18223650be51SPawel Jakub Dawidek * Delay the request if it is colliding with a synchronization 18233650be51SPawel Jakub Dawidek * request. 18243650be51SPawel Jakub Dawidek */ 18253650be51SPawel Jakub Dawidek if (g_raid3_sync_collision(sc, pbp)) { 18263650be51SPawel Jakub Dawidek g_raid3_regular_delay(sc, pbp); 18273650be51SPawel Jakub Dawidek return (0); 18283650be51SPawel Jakub Dawidek } 1829d2fb9c62SPawel Jakub Dawidek 18304d006a98SPawel Jakub Dawidek if (sc->sc_idle) 18314d006a98SPawel Jakub Dawidek g_raid3_unidle(sc); 18320962f942SPawel Jakub Dawidek else 183301f1f41cSPawel Jakub Dawidek sc->sc_last_write = time_uptime; 18344d006a98SPawel Jakub Dawidek 18352d1661a5SPawel Jakub Dawidek ndisks = sc->sc_ndisks; 18362d1661a5SPawel Jakub Dawidek break; 18372d1661a5SPawel Jakub Dawidek } 18382d1661a5SPawel Jakub Dawidek for (n = 0; n < ndisks; n++) { 18392d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 18402d1661a5SPawel Jakub Dawidek cbp = g_raid3_clone_bio(sc, pbp); 18412d1661a5SPawel Jakub Dawidek if (cbp == NULL) { 18422d1661a5SPawel Jakub Dawidek while ((cbp = G_RAID3_HEAD_BIO(pbp)) != NULL) 18432d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 1844a65a0da2SPawel Jakub Dawidek /* 1845a65a0da2SPawel Jakub Dawidek * To prevent deadlock, we must run back up 1846a65a0da2SPawel Jakub Dawidek * with the ENOMEM for failed requests of any 1847a65a0da2SPawel Jakub Dawidek * of our consumers. Our own sync requests 1848a65a0da2SPawel Jakub Dawidek * can stick around, as they are finite. 
1849a65a0da2SPawel Jakub Dawidek */ 1850a65a0da2SPawel Jakub Dawidek if ((pbp->bio_cflags & 1851a65a0da2SPawel Jakub Dawidek G_RAID3_BIO_CFLAG_REGULAR) != 0) { 1852a65a0da2SPawel Jakub Dawidek g_io_deliver(pbp, ENOMEM); 1853a65a0da2SPawel Jakub Dawidek return (0); 1854a65a0da2SPawel Jakub Dawidek } 18552d1661a5SPawel Jakub Dawidek return (ENOMEM); 18562d1661a5SPawel Jakub Dawidek } 18572d1661a5SPawel Jakub Dawidek cbp->bio_offset = offset; 18582d1661a5SPawel Jakub Dawidek cbp->bio_length = length; 18592d1661a5SPawel Jakub Dawidek cbp->bio_done = g_raid3_done; 18602d1661a5SPawel Jakub Dawidek switch (pbp->bio_cmd) { 18612d1661a5SPawel Jakub Dawidek case BIO_READ: 18622d1661a5SPawel Jakub Dawidek if (disk->d_state != G_RAID3_DISK_STATE_ACTIVE) { 18632d1661a5SPawel Jakub Dawidek /* 18642d1661a5SPawel Jakub Dawidek * Replace invalid component with the parity 18652d1661a5SPawel Jakub Dawidek * component. 18662d1661a5SPawel Jakub Dawidek */ 18672d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[sc->sc_ndisks - 1]; 18682d1661a5SPawel Jakub Dawidek cbp->bio_cflags |= G_RAID3_BIO_CFLAG_PARITY; 18692d1661a5SPawel Jakub Dawidek pbp->bio_pflags |= G_RAID3_BIO_PFLAG_DEGRADED; 1870f5a2f7feSPawel Jakub Dawidek } else if (round_robin && 1871f5a2f7feSPawel Jakub Dawidek disk->d_no == sc->sc_round_robin) { 1872f5a2f7feSPawel Jakub Dawidek /* 1873f5a2f7feSPawel Jakub Dawidek * In round-robin mode skip one data component 1874f5a2f7feSPawel Jakub Dawidek * and use parity component when reading. 
1875f5a2f7feSPawel Jakub Dawidek */ 1876f5a2f7feSPawel Jakub Dawidek pbp->bio_driver2 = disk; 1877f5a2f7feSPawel Jakub Dawidek disk = &sc->sc_disks[sc->sc_ndisks - 1]; 1878f5a2f7feSPawel Jakub Dawidek cbp->bio_cflags |= G_RAID3_BIO_CFLAG_PARITY; 1879f5a2f7feSPawel Jakub Dawidek sc->sc_round_robin++; 1880f5a2f7feSPawel Jakub Dawidek round_robin = 0; 1881dba915cfSPawel Jakub Dawidek } else if (verify && disk->d_no == sc->sc_ndisks - 1) { 1882dba915cfSPawel Jakub Dawidek cbp->bio_cflags |= G_RAID3_BIO_CFLAG_PARITY; 18832d1661a5SPawel Jakub Dawidek } 18842d1661a5SPawel Jakub Dawidek break; 18852d1661a5SPawel Jakub Dawidek case BIO_WRITE: 18862d1661a5SPawel Jakub Dawidek case BIO_DELETE: 18872d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_ACTIVE || 18882d1661a5SPawel Jakub Dawidek disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING) { 18892d1661a5SPawel Jakub Dawidek if (n == ndisks - 1) { 18902d1661a5SPawel Jakub Dawidek /* 18912d1661a5SPawel Jakub Dawidek * Active parity component, mark it as such. 18922d1661a5SPawel Jakub Dawidek */ 18932d1661a5SPawel Jakub Dawidek cbp->bio_cflags |= 18942d1661a5SPawel Jakub Dawidek G_RAID3_BIO_CFLAG_PARITY; 18952d1661a5SPawel Jakub Dawidek } 18962d1661a5SPawel Jakub Dawidek } else { 18972d1661a5SPawel Jakub Dawidek pbp->bio_pflags |= G_RAID3_BIO_PFLAG_DEGRADED; 18982d1661a5SPawel Jakub Dawidek if (n == ndisks - 1) { 18992d1661a5SPawel Jakub Dawidek /* 19002d1661a5SPawel Jakub Dawidek * Parity component is not connected, 19012d1661a5SPawel Jakub Dawidek * so destroy its request. 
19022d1661a5SPawel Jakub Dawidek */ 19032d1661a5SPawel Jakub Dawidek pbp->bio_pflags |= 19042d1661a5SPawel Jakub Dawidek G_RAID3_BIO_PFLAG_NOPARITY; 19052d1661a5SPawel Jakub Dawidek g_raid3_destroy_bio(sc, cbp); 19062d1661a5SPawel Jakub Dawidek cbp = NULL; 19072d1661a5SPawel Jakub Dawidek } else { 19082d1661a5SPawel Jakub Dawidek cbp->bio_cflags |= 19092d1661a5SPawel Jakub Dawidek G_RAID3_BIO_CFLAG_NODISK; 19102d1661a5SPawel Jakub Dawidek disk = NULL; 19112d1661a5SPawel Jakub Dawidek } 19122d1661a5SPawel Jakub Dawidek } 19132d1661a5SPawel Jakub Dawidek break; 19142d1661a5SPawel Jakub Dawidek } 19152d1661a5SPawel Jakub Dawidek if (cbp != NULL) 19162d1661a5SPawel Jakub Dawidek cbp->bio_caller2 = disk; 19172d1661a5SPawel Jakub Dawidek } 19182d1661a5SPawel Jakub Dawidek switch (pbp->bio_cmd) { 19192d1661a5SPawel Jakub Dawidek case BIO_READ: 1920f5a2f7feSPawel Jakub Dawidek if (round_robin) { 1921f5a2f7feSPawel Jakub Dawidek /* 1922f5a2f7feSPawel Jakub Dawidek * If we are in round-robin mode and 'round_robin' is 1923f5a2f7feSPawel Jakub Dawidek * still 1, it means, that we skipped parity component 1924f5a2f7feSPawel Jakub Dawidek * for this read and must reset sc_round_robin field. 
1925f5a2f7feSPawel Jakub Dawidek */ 1926f5a2f7feSPawel Jakub Dawidek sc->sc_round_robin = 0; 1927f5a2f7feSPawel Jakub Dawidek } 1928ee40c7aaSPawel Jakub Dawidek G_RAID3_FOREACH_SAFE_BIO(pbp, cbp, tmpbp) { 19292d1661a5SPawel Jakub Dawidek disk = cbp->bio_caller2; 19302d1661a5SPawel Jakub Dawidek cp = disk->d_consumer; 19312d1661a5SPawel Jakub Dawidek cbp->bio_to = cp->provider; 19322d1661a5SPawel Jakub Dawidek G_RAID3_LOGREQ(3, cbp, "Sending request."); 19333650be51SPawel Jakub Dawidek KASSERT(cp->acr >= 1 && cp->acw >= 1 && cp->ace >= 1, 19342d1661a5SPawel Jakub Dawidek ("Consumer %s not opened (r%dw%de%d).", 19352d1661a5SPawel Jakub Dawidek cp->provider->name, cp->acr, cp->acw, cp->ace)); 193679e61493SPawel Jakub Dawidek cp->index++; 19372d1661a5SPawel Jakub Dawidek g_io_request(cbp, cp); 19382d1661a5SPawel Jakub Dawidek } 19392d1661a5SPawel Jakub Dawidek break; 19402d1661a5SPawel Jakub Dawidek case BIO_WRITE: 19412d1661a5SPawel Jakub Dawidek case BIO_DELETE: 19422d1661a5SPawel Jakub Dawidek /* 19433650be51SPawel Jakub Dawidek * Put request onto inflight queue, so we can check if new 19443650be51SPawel Jakub Dawidek * synchronization requests don't collide with it. 19453650be51SPawel Jakub Dawidek */ 19463650be51SPawel Jakub Dawidek bioq_insert_tail(&sc->sc_inflight, pbp); 19473650be51SPawel Jakub Dawidek 19483650be51SPawel Jakub Dawidek /* 19492d1661a5SPawel Jakub Dawidek * Bump syncid on first write. 
19502d1661a5SPawel Jakub Dawidek */ 1951ea973705SPawel Jakub Dawidek if ((sc->sc_bump_id & G_RAID3_BUMP_SYNCID) != 0) { 1952a245a548SPawel Jakub Dawidek sc->sc_bump_id &= ~G_RAID3_BUMP_SYNCID; 1953d97d5ee9SPawel Jakub Dawidek g_raid3_bump_syncid(sc); 19542d1661a5SPawel Jakub Dawidek } 19552d1661a5SPawel Jakub Dawidek g_raid3_scatter(pbp); 19562d1661a5SPawel Jakub Dawidek break; 19572d1661a5SPawel Jakub Dawidek } 19582d1661a5SPawel Jakub Dawidek return (0); 19592d1661a5SPawel Jakub Dawidek } 19602d1661a5SPawel Jakub Dawidek 19612d1661a5SPawel Jakub Dawidek static int 19622d1661a5SPawel Jakub Dawidek g_raid3_can_destroy(struct g_raid3_softc *sc) 19632d1661a5SPawel Jakub Dawidek { 19642d1661a5SPawel Jakub Dawidek struct g_geom *gp; 19652d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 19662d1661a5SPawel Jakub Dawidek 19672d1661a5SPawel Jakub Dawidek g_topology_assert(); 19682d1661a5SPawel Jakub Dawidek gp = sc->sc_geom; 196918486a5eSPawel Jakub Dawidek if (gp->softc == NULL) 197018486a5eSPawel Jakub Dawidek return (1); 19712d1661a5SPawel Jakub Dawidek LIST_FOREACH(cp, &gp->consumer, consumer) { 19722d1661a5SPawel Jakub Dawidek if (g_raid3_is_busy(sc, cp)) 19732d1661a5SPawel Jakub Dawidek return (0); 19742d1661a5SPawel Jakub Dawidek } 19752d1661a5SPawel Jakub Dawidek gp = sc->sc_sync.ds_geom; 19762d1661a5SPawel Jakub Dawidek LIST_FOREACH(cp, &gp->consumer, consumer) { 19772d1661a5SPawel Jakub Dawidek if (g_raid3_is_busy(sc, cp)) 19782d1661a5SPawel Jakub Dawidek return (0); 19792d1661a5SPawel Jakub Dawidek } 19802d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "No I/O requests for %s, it can be destroyed.", 19812d1661a5SPawel Jakub Dawidek sc->sc_name); 19822d1661a5SPawel Jakub Dawidek return (1); 19832d1661a5SPawel Jakub Dawidek } 19842d1661a5SPawel Jakub Dawidek 19852d1661a5SPawel Jakub Dawidek static int 19862d1661a5SPawel Jakub Dawidek g_raid3_try_destroy(struct g_raid3_softc *sc) 19872d1661a5SPawel Jakub Dawidek { 19882d1661a5SPawel Jakub Dawidek 19893650be51SPawel 
Jakub Dawidek g_topology_assert_not(); 19903650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 19913650be51SPawel Jakub Dawidek 19924ed854e8SPawel Jakub Dawidek if (sc->sc_rootmount != NULL) { 19934ed854e8SPawel Jakub Dawidek G_RAID3_DEBUG(1, "root_mount_rel[%u] %p", __LINE__, 19944ed854e8SPawel Jakub Dawidek sc->sc_rootmount); 19954ed854e8SPawel Jakub Dawidek root_mount_rel(sc->sc_rootmount); 19964ed854e8SPawel Jakub Dawidek sc->sc_rootmount = NULL; 19974ed854e8SPawel Jakub Dawidek } 19984ed854e8SPawel Jakub Dawidek 19992d1661a5SPawel Jakub Dawidek g_topology_lock(); 20002d1661a5SPawel Jakub Dawidek if (!g_raid3_can_destroy(sc)) { 20012d1661a5SPawel Jakub Dawidek g_topology_unlock(); 20022d1661a5SPawel Jakub Dawidek return (0); 20032d1661a5SPawel Jakub Dawidek } 200418486a5eSPawel Jakub Dawidek sc->sc_geom->softc = NULL; 200518486a5eSPawel Jakub Dawidek sc->sc_sync.ds_geom->softc = NULL; 2006a245a548SPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_WAIT) != 0) { 20072d1661a5SPawel Jakub Dawidek g_topology_unlock(); 20082d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, 20092d1661a5SPawel Jakub Dawidek &sc->sc_worker); 20103650be51SPawel Jakub Dawidek /* Unlock sc_lock here, as it can be destroyed after wakeup. */ 20113650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 20122d1661a5SPawel Jakub Dawidek wakeup(&sc->sc_worker); 20132d1661a5SPawel Jakub Dawidek sc->sc_worker = NULL; 20142d1661a5SPawel Jakub Dawidek } else { 20152d1661a5SPawel Jakub Dawidek g_topology_unlock(); 20163650be51SPawel Jakub Dawidek g_raid3_destroy_device(sc); 20172d1661a5SPawel Jakub Dawidek free(sc->sc_disks, M_RAID3); 20182d1661a5SPawel Jakub Dawidek free(sc, M_RAID3); 20192d1661a5SPawel Jakub Dawidek } 20202d1661a5SPawel Jakub Dawidek return (1); 20212d1661a5SPawel Jakub Dawidek } 20222d1661a5SPawel Jakub Dawidek 20232d1661a5SPawel Jakub Dawidek /* 20242d1661a5SPawel Jakub Dawidek * Worker thread. 
20252d1661a5SPawel Jakub Dawidek */ 20262d1661a5SPawel Jakub Dawidek static void 20272d1661a5SPawel Jakub Dawidek g_raid3_worker(void *arg) 20282d1661a5SPawel Jakub Dawidek { 20292d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 20302d1661a5SPawel Jakub Dawidek struct g_raid3_event *ep; 20312d1661a5SPawel Jakub Dawidek struct bio *bp; 20320962f942SPawel Jakub Dawidek int timeout; 20332d1661a5SPawel Jakub Dawidek 20342d1661a5SPawel Jakub Dawidek sc = arg; 2035982d11f8SJeff Roberson thread_lock(curthread); 203663710c4dSJohn Baldwin sched_prio(curthread, PRIBIO); 2037982d11f8SJeff Roberson thread_unlock(curthread); 20382d1661a5SPawel Jakub Dawidek 20393650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 20402d1661a5SPawel Jakub Dawidek for (;;) { 20412d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(5, "%s: Let's see...", __func__); 20422d1661a5SPawel Jakub Dawidek /* 20432d1661a5SPawel Jakub Dawidek * First take a look at events. 20442d1661a5SPawel Jakub Dawidek * This is important to handle events before any I/O requests. 20452d1661a5SPawel Jakub Dawidek */ 20462d1661a5SPawel Jakub Dawidek ep = g_raid3_event_get(sc); 20473650be51SPawel Jakub Dawidek if (ep != NULL) { 2048d97d5ee9SPawel Jakub Dawidek g_raid3_event_remove(sc, ep); 20492d1661a5SPawel Jakub Dawidek if ((ep->e_flags & G_RAID3_EVENT_DEVICE) != 0) { 20502d1661a5SPawel Jakub Dawidek /* Update only device status. */ 20512d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(3, 20522d1661a5SPawel Jakub Dawidek "Running event for device %s.", 20532d1661a5SPawel Jakub Dawidek sc->sc_name); 20542d1661a5SPawel Jakub Dawidek ep->e_error = 0; 2055d97d5ee9SPawel Jakub Dawidek g_raid3_update_device(sc, 1); 20562d1661a5SPawel Jakub Dawidek } else { 20572d1661a5SPawel Jakub Dawidek /* Update disk status. 
*/ 20582d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(3, "Running event for disk %s.", 20592d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(ep->e_disk)); 20602d1661a5SPawel Jakub Dawidek ep->e_error = g_raid3_update_disk(ep->e_disk, 2061d97d5ee9SPawel Jakub Dawidek ep->e_state); 20622d1661a5SPawel Jakub Dawidek if (ep->e_error == 0) 2063d97d5ee9SPawel Jakub Dawidek g_raid3_update_device(sc, 0); 20642d1661a5SPawel Jakub Dawidek } 20652d1661a5SPawel Jakub Dawidek if ((ep->e_flags & G_RAID3_EVENT_DONTWAIT) != 0) { 20662d1661a5SPawel Jakub Dawidek KASSERT(ep->e_error == 0, 20672d1661a5SPawel Jakub Dawidek ("Error cannot be handled.")); 20682d1661a5SPawel Jakub Dawidek g_raid3_event_free(ep); 20692d1661a5SPawel Jakub Dawidek } else { 20702d1661a5SPawel Jakub Dawidek ep->e_flags |= G_RAID3_EVENT_DONE; 20712d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, 20722d1661a5SPawel Jakub Dawidek ep); 20732d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_events_mtx); 20742d1661a5SPawel Jakub Dawidek wakeup(ep); 20752d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_events_mtx); 20762d1661a5SPawel Jakub Dawidek } 20772d1661a5SPawel Jakub Dawidek if ((sc->sc_flags & 20782d1661a5SPawel Jakub Dawidek G_RAID3_DEVICE_FLAG_DESTROY) != 0) { 20793650be51SPawel Jakub Dawidek if (g_raid3_try_destroy(sc)) { 20803650be51SPawel Jakub Dawidek curthread->td_pflags &= ~TDP_GEOM; 20813650be51SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Thread exiting."); 20823745c395SJulian Elischer kproc_exit(0); 20832d1661a5SPawel Jakub Dawidek } 20843650be51SPawel Jakub Dawidek } 20852d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(5, "%s: I'm here 1.", __func__); 20862d1661a5SPawel Jakub Dawidek continue; 20872d1661a5SPawel Jakub Dawidek } 20882d1661a5SPawel Jakub Dawidek /* 20890962f942SPawel Jakub Dawidek * Check if we can mark array as CLEAN and if we can't take 20900962f942SPawel Jakub Dawidek * how much seconds should we wait. 
20910962f942SPawel Jakub Dawidek */ 20923650be51SPawel Jakub Dawidek timeout = g_raid3_idle(sc, -1); 20930962f942SPawel Jakub Dawidek /* 20942d1661a5SPawel Jakub Dawidek * Now I/O requests. 20952d1661a5SPawel Jakub Dawidek */ 20962d1661a5SPawel Jakub Dawidek /* Get first request from the queue. */ 20972d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 20982d1661a5SPawel Jakub Dawidek bp = bioq_first(&sc->sc_queue); 20992d1661a5SPawel Jakub Dawidek if (bp == NULL) { 21002d1661a5SPawel Jakub Dawidek if ((sc->sc_flags & 21012d1661a5SPawel Jakub Dawidek G_RAID3_DEVICE_FLAG_DESTROY) != 0) { 21022d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 21033650be51SPawel Jakub Dawidek if (g_raid3_try_destroy(sc)) { 21043650be51SPawel Jakub Dawidek curthread->td_pflags &= ~TDP_GEOM; 2105d7fad9f6SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Thread exiting."); 21063745c395SJulian Elischer kproc_exit(0); 21073650be51SPawel Jakub Dawidek } 21082d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 21092d1661a5SPawel Jakub Dawidek } 21103650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 2111a2fe5c66SPawel Jakub Dawidek /* 2112a2fe5c66SPawel Jakub Dawidek * XXX: We can miss an event here, because an event 2113a2fe5c66SPawel Jakub Dawidek * can be added without sx-device-lock and without 2114a2fe5c66SPawel Jakub Dawidek * mtx-queue-lock. Maybe I should just stop using 2115a2fe5c66SPawel Jakub Dawidek * dedicated mutex for events synchronization and 2116a2fe5c66SPawel Jakub Dawidek * stick with the queue lock? 2117a2fe5c66SPawel Jakub Dawidek * The event will hang here until next I/O request 2118a2fe5c66SPawel Jakub Dawidek * or next event is received. 
2119a2fe5c66SPawel Jakub Dawidek */ 21200962f942SPawel Jakub Dawidek MSLEEP(sc, &sc->sc_queue_mtx, PRIBIO | PDROP, "r3:w1", 21210962f942SPawel Jakub Dawidek timeout * hz); 21223650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 21239bb09163SPawel Jakub Dawidek G_RAID3_DEBUG(5, "%s: I'm here 4.", __func__); 21242d1661a5SPawel Jakub Dawidek continue; 21252d1661a5SPawel Jakub Dawidek } 212684edb86dSPawel Jakub Dawidek process: 21272d1661a5SPawel Jakub Dawidek bioq_remove(&sc->sc_queue, bp); 21282d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 21292d1661a5SPawel Jakub Dawidek 21308e007c52SPawel Jakub Dawidek if (bp->bio_from->geom == sc->sc_sync.ds_geom && 21318e007c52SPawel Jakub Dawidek (bp->bio_cflags & G_RAID3_BIO_CFLAG_SYNC) != 0) { 21328e007c52SPawel Jakub Dawidek g_raid3_sync_request(bp); /* READ */ 21338e007c52SPawel Jakub Dawidek } else if (bp->bio_to != sc->sc_provider) { 21343650be51SPawel Jakub Dawidek if ((bp->bio_cflags & G_RAID3_BIO_CFLAG_REGULAR) != 0) 21352d1661a5SPawel Jakub Dawidek g_raid3_regular_request(bp); 21363650be51SPawel Jakub Dawidek else if ((bp->bio_cflags & G_RAID3_BIO_CFLAG_SYNC) != 0) 21378e007c52SPawel Jakub Dawidek g_raid3_sync_request(bp); /* WRITE */ 2138de6f1c7cSPawel Jakub Dawidek else { 2139de6f1c7cSPawel Jakub Dawidek KASSERT(0, 2140de6f1c7cSPawel Jakub Dawidek ("Invalid request cflags=0x%hhx to=%s.", 2141de6f1c7cSPawel Jakub Dawidek bp->bio_cflags, bp->bio_to->name)); 2142de6f1c7cSPawel Jakub Dawidek } 2143de6f1c7cSPawel Jakub Dawidek } else if (g_raid3_register_request(bp) != 0) { 21442d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 21453650be51SPawel Jakub Dawidek bioq_insert_head(&sc->sc_queue, bp); 214684edb86dSPawel Jakub Dawidek /* 214784edb86dSPawel Jakub Dawidek * We are short in memory, let see if there are finished 214884edb86dSPawel Jakub Dawidek * request we can free. 
214984edb86dSPawel Jakub Dawidek */ 215084edb86dSPawel Jakub Dawidek TAILQ_FOREACH(bp, &sc->sc_queue.queue, bio_queue) { 215184edb86dSPawel Jakub Dawidek if (bp->bio_cflags & G_RAID3_BIO_CFLAG_REGULAR) 215284edb86dSPawel Jakub Dawidek goto process; 21532d1661a5SPawel Jakub Dawidek } 215484edb86dSPawel Jakub Dawidek /* 215584edb86dSPawel Jakub Dawidek * No finished regular request, so at least keep 215684edb86dSPawel Jakub Dawidek * synchronization running. 215784edb86dSPawel Jakub Dawidek */ 215884edb86dSPawel Jakub Dawidek TAILQ_FOREACH(bp, &sc->sc_queue.queue, bio_queue) { 215984edb86dSPawel Jakub Dawidek if (bp->bio_cflags & G_RAID3_BIO_CFLAG_SYNC) 216084edb86dSPawel Jakub Dawidek goto process; 216184edb86dSPawel Jakub Dawidek } 216284edb86dSPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 216384edb86dSPawel Jakub Dawidek MSLEEP(&sc->sc_queue, &sc->sc_queue_mtx, PRIBIO | PDROP, 216484edb86dSPawel Jakub Dawidek "r3:lowmem", hz / 10); 216584edb86dSPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 21662d1661a5SPawel Jakub Dawidek } 2167d97d5ee9SPawel Jakub Dawidek G_RAID3_DEBUG(5, "%s: I'm here 9.", __func__); 21682d1661a5SPawel Jakub Dawidek } 21692d1661a5SPawel Jakub Dawidek } 21702d1661a5SPawel Jakub Dawidek 21712d1661a5SPawel Jakub Dawidek static void 21720962f942SPawel Jakub Dawidek g_raid3_update_idle(struct g_raid3_softc *sc, struct g_raid3_disk *disk) 21732d1661a5SPawel Jakub Dawidek { 21742d1661a5SPawel Jakub Dawidek 21753650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_LOCKED); 2176501250baSPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_NOFAILSYNC) != 0) 2177501250baSPawel Jakub Dawidek return; 21780962f942SPawel Jakub Dawidek if (!sc->sc_idle && (disk->d_flags & G_RAID3_DISK_FLAG_DIRTY) == 0) { 21792d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Disk %s (device %s) marked as dirty.", 21803650be51SPawel Jakub Dawidek g_raid3_get_diskname(disk), sc->sc_name); 21812d1661a5SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_DIRTY; 
21820962f942SPawel Jakub Dawidek } else if (sc->sc_idle && 21830962f942SPawel Jakub Dawidek (disk->d_flags & G_RAID3_DISK_FLAG_DIRTY) != 0) { 21842d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Disk %s (device %s) marked as clean.", 21853650be51SPawel Jakub Dawidek g_raid3_get_diskname(disk), sc->sc_name); 21862d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 21872d1661a5SPawel Jakub Dawidek } 21882d1661a5SPawel Jakub Dawidek } 21892d1661a5SPawel Jakub Dawidek 21902d1661a5SPawel Jakub Dawidek static void 21912d1661a5SPawel Jakub Dawidek g_raid3_sync_start(struct g_raid3_softc *sc) 21922d1661a5SPawel Jakub Dawidek { 21932d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 21943650be51SPawel Jakub Dawidek struct g_consumer *cp; 21953650be51SPawel Jakub Dawidek struct bio *bp; 21962d1661a5SPawel Jakub Dawidek int error; 21972d1661a5SPawel Jakub Dawidek u_int n; 21982d1661a5SPawel Jakub Dawidek 21993650be51SPawel Jakub Dawidek g_topology_assert_not(); 22003650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 22012d1661a5SPawel Jakub Dawidek 22022d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED, 22032d1661a5SPawel Jakub Dawidek ("Device not in DEGRADED state (%s, %u).", sc->sc_name, 22042d1661a5SPawel Jakub Dawidek sc->sc_state)); 22052d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_syncdisk == NULL, ("Syncdisk is not NULL (%s, %u).", 22062d1661a5SPawel Jakub Dawidek sc->sc_name, sc->sc_state)); 22072d1661a5SPawel Jakub Dawidek disk = NULL; 22082d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 22092d1661a5SPawel Jakub Dawidek if (sc->sc_disks[n].d_state != G_RAID3_DISK_STATE_SYNCHRONIZING) 22102d1661a5SPawel Jakub Dawidek continue; 22112d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 22122d1661a5SPawel Jakub Dawidek break; 22132d1661a5SPawel Jakub Dawidek } 22142d1661a5SPawel Jakub Dawidek if (disk == NULL) 22152d1661a5SPawel Jakub Dawidek return; 22162d1661a5SPawel Jakub Dawidek 
22173650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 22183650be51SPawel Jakub Dawidek g_topology_lock(); 22193650be51SPawel Jakub Dawidek cp = g_new_consumer(sc->sc_sync.ds_geom); 22203650be51SPawel Jakub Dawidek error = g_attach(cp, sc->sc_provider); 22213650be51SPawel Jakub Dawidek KASSERT(error == 0, 22223650be51SPawel Jakub Dawidek ("Cannot attach to %s (error=%d).", sc->sc_name, error)); 22233650be51SPawel Jakub Dawidek error = g_access(cp, 1, 0, 0); 22243650be51SPawel Jakub Dawidek KASSERT(error == 0, ("Cannot open %s (error=%d).", sc->sc_name, error)); 22253650be51SPawel Jakub Dawidek g_topology_unlock(); 22263650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 22273650be51SPawel Jakub Dawidek 22282d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: rebuilding provider %s.", sc->sc_name, 22292d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk)); 2230501250baSPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_NOFAILSYNC) == 0) 22312d1661a5SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_DIRTY; 22322d1661a5SPawel Jakub Dawidek KASSERT(disk->d_sync.ds_consumer == NULL, 22332d1661a5SPawel Jakub Dawidek ("Sync consumer already exists (device=%s, disk=%s).", 22342d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk))); 22353650be51SPawel Jakub Dawidek 22363650be51SPawel Jakub Dawidek disk->d_sync.ds_consumer = cp; 22372d1661a5SPawel Jakub Dawidek disk->d_sync.ds_consumer->private = disk; 223879e61493SPawel Jakub Dawidek disk->d_sync.ds_consumer->index = 0; 22392d1661a5SPawel Jakub Dawidek sc->sc_syncdisk = disk; 22403650be51SPawel Jakub Dawidek 22413650be51SPawel Jakub Dawidek /* 22423650be51SPawel Jakub Dawidek * Allocate memory for synchronization bios and initialize them. 
22433650be51SPawel Jakub Dawidek */ 22443650be51SPawel Jakub Dawidek disk->d_sync.ds_bios = malloc(sizeof(struct bio *) * g_raid3_syncreqs, 22453650be51SPawel Jakub Dawidek M_RAID3, M_WAITOK); 22463650be51SPawel Jakub Dawidek for (n = 0; n < g_raid3_syncreqs; n++) { 22473650be51SPawel Jakub Dawidek bp = g_alloc_bio(); 22483650be51SPawel Jakub Dawidek disk->d_sync.ds_bios[n] = bp; 22493650be51SPawel Jakub Dawidek bp->bio_parent = NULL; 22503650be51SPawel Jakub Dawidek bp->bio_cmd = BIO_READ; 22513650be51SPawel Jakub Dawidek bp->bio_data = malloc(MAXPHYS, M_RAID3, M_WAITOK); 22523650be51SPawel Jakub Dawidek bp->bio_cflags = 0; 22533650be51SPawel Jakub Dawidek bp->bio_offset = disk->d_sync.ds_offset * (sc->sc_ndisks - 1); 22543650be51SPawel Jakub Dawidek bp->bio_length = MIN(MAXPHYS, sc->sc_mediasize - bp->bio_offset); 22553650be51SPawel Jakub Dawidek disk->d_sync.ds_offset += bp->bio_length / (sc->sc_ndisks - 1); 22563650be51SPawel Jakub Dawidek bp->bio_done = g_raid3_sync_done; 22573650be51SPawel Jakub Dawidek bp->bio_from = disk->d_sync.ds_consumer; 22583650be51SPawel Jakub Dawidek bp->bio_to = sc->sc_provider; 2259ef25813dSRuslan Ermilov bp->bio_caller1 = (void *)(uintptr_t)n; 22603650be51SPawel Jakub Dawidek } 22613650be51SPawel Jakub Dawidek 22623650be51SPawel Jakub Dawidek /* Set the number of in-flight synchronization requests. */ 22633650be51SPawel Jakub Dawidek disk->d_sync.ds_inflight = g_raid3_syncreqs; 22643650be51SPawel Jakub Dawidek 22653650be51SPawel Jakub Dawidek /* 22663650be51SPawel Jakub Dawidek * Fire off first synchronization requests. 
22673650be51SPawel Jakub Dawidek */ 22683650be51SPawel Jakub Dawidek for (n = 0; n < g_raid3_syncreqs; n++) { 22693650be51SPawel Jakub Dawidek bp = disk->d_sync.ds_bios[n]; 22703650be51SPawel Jakub Dawidek G_RAID3_LOGREQ(3, bp, "Sending synchronization request."); 22713650be51SPawel Jakub Dawidek disk->d_sync.ds_consumer->index++; 22723650be51SPawel Jakub Dawidek /* 22733650be51SPawel Jakub Dawidek * Delay the request if it is colliding with a regular request. 22743650be51SPawel Jakub Dawidek */ 22753650be51SPawel Jakub Dawidek if (g_raid3_regular_collision(sc, bp)) 22763650be51SPawel Jakub Dawidek g_raid3_sync_delay(sc, bp); 22773650be51SPawel Jakub Dawidek else 22783650be51SPawel Jakub Dawidek g_io_request(bp, disk->d_sync.ds_consumer); 22793650be51SPawel Jakub Dawidek } 22802d1661a5SPawel Jakub Dawidek } 22812d1661a5SPawel Jakub Dawidek 22822d1661a5SPawel Jakub Dawidek /* 22832d1661a5SPawel Jakub Dawidek * Stop synchronization process. 22842d1661a5SPawel Jakub Dawidek * type: 0 - synchronization finished 22852d1661a5SPawel Jakub Dawidek * 1 - synchronization stopped 22862d1661a5SPawel Jakub Dawidek */ 22872d1661a5SPawel Jakub Dawidek static void 22882d1661a5SPawel Jakub Dawidek g_raid3_sync_stop(struct g_raid3_softc *sc, int type) 22892d1661a5SPawel Jakub Dawidek { 22902d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 22913650be51SPawel Jakub Dawidek struct g_consumer *cp; 22922d1661a5SPawel Jakub Dawidek 22933650be51SPawel Jakub Dawidek g_topology_assert_not(); 22943650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_LOCKED); 22953650be51SPawel Jakub Dawidek 22962d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED, 22972d1661a5SPawel Jakub Dawidek ("Device not in DEGRADED state (%s, %u).", sc->sc_name, 22982d1661a5SPawel Jakub Dawidek sc->sc_state)); 22992d1661a5SPawel Jakub Dawidek disk = sc->sc_syncdisk; 23002d1661a5SPawel Jakub Dawidek sc->sc_syncdisk = NULL; 23012d1661a5SPawel Jakub Dawidek KASSERT(disk != NULL, ("No 
disk was synchronized (%s).", sc->sc_name)); 23022d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING, 23032d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", g_raid3_get_diskname(disk), 23042d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 23052d1661a5SPawel Jakub Dawidek if (disk->d_sync.ds_consumer == NULL) 23062d1661a5SPawel Jakub Dawidek return; 23072d1661a5SPawel Jakub Dawidek 23082d1661a5SPawel Jakub Dawidek if (type == 0) { 23092d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: rebuilding provider %s finished.", 23103650be51SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk)); 23112d1661a5SPawel Jakub Dawidek } else /* if (type == 1) */ { 23122d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: rebuilding provider %s stopped.", 23133650be51SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk)); 23142d1661a5SPawel Jakub Dawidek } 23153650be51SPawel Jakub Dawidek free(disk->d_sync.ds_bios, M_RAID3); 23163650be51SPawel Jakub Dawidek disk->d_sync.ds_bios = NULL; 23173650be51SPawel Jakub Dawidek cp = disk->d_sync.ds_consumer; 23182d1661a5SPawel Jakub Dawidek disk->d_sync.ds_consumer = NULL; 23192d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 23203650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); /* Avoid recursion on sc_lock. 
*/ 23213650be51SPawel Jakub Dawidek g_topology_lock(); 23223650be51SPawel Jakub Dawidek g_raid3_kill_consumer(sc, cp); 23233650be51SPawel Jakub Dawidek g_topology_unlock(); 23243650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 23252d1661a5SPawel Jakub Dawidek } 23262d1661a5SPawel Jakub Dawidek 23272d1661a5SPawel Jakub Dawidek static void 23282d1661a5SPawel Jakub Dawidek g_raid3_launch_provider(struct g_raid3_softc *sc) 23292d1661a5SPawel Jakub Dawidek { 23302d1661a5SPawel Jakub Dawidek struct g_provider *pp; 2331113d8e50SAlexander Motin struct g_raid3_disk *disk; 2332113d8e50SAlexander Motin int n; 23332d1661a5SPawel Jakub Dawidek 23343650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_LOCKED); 23352d1661a5SPawel Jakub Dawidek 23363650be51SPawel Jakub Dawidek g_topology_lock(); 23372d1661a5SPawel Jakub Dawidek pp = g_new_providerf(sc->sc_geom, "raid3/%s", sc->sc_name); 23382d1661a5SPawel Jakub Dawidek pp->mediasize = sc->sc_mediasize; 23392d1661a5SPawel Jakub Dawidek pp->sectorsize = sc->sc_sectorsize; 2340113d8e50SAlexander Motin pp->stripesize = 0; 2341113d8e50SAlexander Motin pp->stripeoffset = 0; 2342113d8e50SAlexander Motin for (n = 0; n < sc->sc_ndisks; n++) { 2343113d8e50SAlexander Motin disk = &sc->sc_disks[n]; 2344113d8e50SAlexander Motin if (disk->d_consumer && disk->d_consumer->provider && 2345113d8e50SAlexander Motin disk->d_consumer->provider->stripesize > pp->stripesize) { 2346113d8e50SAlexander Motin pp->stripesize = disk->d_consumer->provider->stripesize; 2347113d8e50SAlexander Motin pp->stripeoffset = disk->d_consumer->provider->stripeoffset; 2348113d8e50SAlexander Motin } 2349113d8e50SAlexander Motin } 2350113d8e50SAlexander Motin pp->stripesize *= sc->sc_ndisks - 1; 2351113d8e50SAlexander Motin pp->stripeoffset *= sc->sc_ndisks - 1; 23522d1661a5SPawel Jakub Dawidek sc->sc_provider = pp; 23532d1661a5SPawel Jakub Dawidek g_error_provider(pp, 0); 23543650be51SPawel Jakub Dawidek g_topology_unlock(); 23550cca572eSJohn-Mark Gurney 
G_RAID3_DEBUG(0, "Device %s launched (%u/%u).", pp->name, 23560cca572eSJohn-Mark Gurney g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE), sc->sc_ndisks); 23570cca572eSJohn-Mark Gurney 23582d1661a5SPawel Jakub Dawidek if (sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED) 23592d1661a5SPawel Jakub Dawidek g_raid3_sync_start(sc); 23602d1661a5SPawel Jakub Dawidek } 23612d1661a5SPawel Jakub Dawidek 23622d1661a5SPawel Jakub Dawidek static void 23632d1661a5SPawel Jakub Dawidek g_raid3_destroy_provider(struct g_raid3_softc *sc) 23642d1661a5SPawel Jakub Dawidek { 23652d1661a5SPawel Jakub Dawidek struct bio *bp; 23662d1661a5SPawel Jakub Dawidek 23673650be51SPawel Jakub Dawidek g_topology_assert_not(); 23682d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_provider != NULL, ("NULL provider (device=%s).", 23692d1661a5SPawel Jakub Dawidek sc->sc_name)); 23702d1661a5SPawel Jakub Dawidek 23713650be51SPawel Jakub Dawidek g_topology_lock(); 23722d1661a5SPawel Jakub Dawidek g_error_provider(sc->sc_provider, ENXIO); 23732d1661a5SPawel Jakub Dawidek mtx_lock(&sc->sc_queue_mtx); 23742d1661a5SPawel Jakub Dawidek while ((bp = bioq_first(&sc->sc_queue)) != NULL) { 23752d1661a5SPawel Jakub Dawidek bioq_remove(&sc->sc_queue, bp); 23762d1661a5SPawel Jakub Dawidek g_io_deliver(bp, ENXIO); 23772d1661a5SPawel Jakub Dawidek } 23782d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 23792d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: provider %s destroyed.", sc->sc_name, 23802d1661a5SPawel Jakub Dawidek sc->sc_provider->name); 23812d1661a5SPawel Jakub Dawidek sc->sc_provider->flags |= G_PF_WITHER; 23822d1661a5SPawel Jakub Dawidek g_orphan_provider(sc->sc_provider, ENXIO); 23833650be51SPawel Jakub Dawidek g_topology_unlock(); 23842d1661a5SPawel Jakub Dawidek sc->sc_provider = NULL; 23852d1661a5SPawel Jakub Dawidek if (sc->sc_syncdisk != NULL) 23862d1661a5SPawel Jakub Dawidek g_raid3_sync_stop(sc, 1); 23872d1661a5SPawel Jakub Dawidek } 23882d1661a5SPawel Jakub Dawidek 23892d1661a5SPawel Jakub 
Dawidek static void 23902d1661a5SPawel Jakub Dawidek g_raid3_go(void *arg) 23912d1661a5SPawel Jakub Dawidek { 23922d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 23932d1661a5SPawel Jakub Dawidek 23942d1661a5SPawel Jakub Dawidek sc = arg; 23952d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Force device %s start due to timeout.", sc->sc_name); 23962d1661a5SPawel Jakub Dawidek g_raid3_event_send(sc, 0, 23972d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_DONTWAIT | G_RAID3_EVENT_DEVICE); 23982d1661a5SPawel Jakub Dawidek } 23992d1661a5SPawel Jakub Dawidek 24002d1661a5SPawel Jakub Dawidek static u_int 24012d1661a5SPawel Jakub Dawidek g_raid3_determine_state(struct g_raid3_disk *disk) 24022d1661a5SPawel Jakub Dawidek { 24032d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 24042d1661a5SPawel Jakub Dawidek u_int state; 24052d1661a5SPawel Jakub Dawidek 24062d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 24072d1661a5SPawel Jakub Dawidek if (sc->sc_syncid == disk->d_sync.ds_syncid) { 24082d1661a5SPawel Jakub Dawidek if ((disk->d_flags & 24092d1661a5SPawel Jakub Dawidek G_RAID3_DISK_FLAG_SYNCHRONIZING) == 0) { 24102d1661a5SPawel Jakub Dawidek /* Disk does not need synchronization. */ 24112d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_ACTIVE; 24122d1661a5SPawel Jakub Dawidek } else { 24132d1661a5SPawel Jakub Dawidek if ((sc->sc_flags & 24142d1661a5SPawel Jakub Dawidek G_RAID3_DEVICE_FLAG_NOAUTOSYNC) == 0 || 24152d1661a5SPawel Jakub Dawidek (disk->d_flags & 24162d1661a5SPawel Jakub Dawidek G_RAID3_DISK_FLAG_FORCE_SYNC) != 0) { 24172d1661a5SPawel Jakub Dawidek /* 24182d1661a5SPawel Jakub Dawidek * We can start synchronization from 24192d1661a5SPawel Jakub Dawidek * the stored offset. 
24202d1661a5SPawel Jakub Dawidek */ 24212d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_SYNCHRONIZING; 24222d1661a5SPawel Jakub Dawidek } else { 24232d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_STALE; 24242d1661a5SPawel Jakub Dawidek } 24252d1661a5SPawel Jakub Dawidek } 24262d1661a5SPawel Jakub Dawidek } else if (disk->d_sync.ds_syncid < sc->sc_syncid) { 24272d1661a5SPawel Jakub Dawidek /* 24282d1661a5SPawel Jakub Dawidek * Reset all synchronization data for this disk, 24292d1661a5SPawel Jakub Dawidek * because if it even was synchronized, it was 24302d1661a5SPawel Jakub Dawidek * synchronized to disks with different syncid. 24312d1661a5SPawel Jakub Dawidek */ 24322d1661a5SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_SYNCHRONIZING; 24332d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset = 0; 24342d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset_done = 0; 24352d1661a5SPawel Jakub Dawidek disk->d_sync.ds_syncid = sc->sc_syncid; 24362d1661a5SPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_NOAUTOSYNC) == 0 || 24372d1661a5SPawel Jakub Dawidek (disk->d_flags & G_RAID3_DISK_FLAG_FORCE_SYNC) != 0) { 24382d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_SYNCHRONIZING; 24392d1661a5SPawel Jakub Dawidek } else { 24402d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_STALE; 24412d1661a5SPawel Jakub Dawidek } 24422d1661a5SPawel Jakub Dawidek } else /* if (sc->sc_syncid < disk->d_sync.ds_syncid) */ { 24432d1661a5SPawel Jakub Dawidek /* 24442d1661a5SPawel Jakub Dawidek * Not good, NOT GOOD! 24452d1661a5SPawel Jakub Dawidek * It means that device was started on stale disks 24462d1661a5SPawel Jakub Dawidek * and more fresh disk just arrive. 24473c57a41dSPawel Jakub Dawidek * If there were writes, device is broken, sorry. 24482d1661a5SPawel Jakub Dawidek * I think the best choice here is don't touch 2449776fc0e9SYaroslav Tykhiy * this disk and inform the user loudly. 
24502d1661a5SPawel Jakub Dawidek */ 24512d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s was started before the freshest " 24522d1661a5SPawel Jakub Dawidek "disk (%s) arrives!! It will not be connected to the " 24532d1661a5SPawel Jakub Dawidek "running device.", sc->sc_name, 24542d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk)); 24552d1661a5SPawel Jakub Dawidek g_raid3_destroy_disk(disk); 24562d1661a5SPawel Jakub Dawidek state = G_RAID3_DISK_STATE_NONE; 24572d1661a5SPawel Jakub Dawidek /* Return immediately, because disk was destroyed. */ 24582d1661a5SPawel Jakub Dawidek return (state); 24592d1661a5SPawel Jakub Dawidek } 24602d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(3, "State for %s disk: %s.", 24612d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), g_raid3_disk_state2str(state)); 24622d1661a5SPawel Jakub Dawidek return (state); 24632d1661a5SPawel Jakub Dawidek } 24642d1661a5SPawel Jakub Dawidek 24652d1661a5SPawel Jakub Dawidek /* 24662d1661a5SPawel Jakub Dawidek * Update device state. 24672d1661a5SPawel Jakub Dawidek */ 24682d1661a5SPawel Jakub Dawidek static void 2469d97d5ee9SPawel Jakub Dawidek g_raid3_update_device(struct g_raid3_softc *sc, boolean_t force) 24702d1661a5SPawel Jakub Dawidek { 24712d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 24722d1661a5SPawel Jakub Dawidek u_int state; 24732d1661a5SPawel Jakub Dawidek 24743650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 24752d1661a5SPawel Jakub Dawidek 24762d1661a5SPawel Jakub Dawidek switch (sc->sc_state) { 24772d1661a5SPawel Jakub Dawidek case G_RAID3_DEVICE_STATE_STARTING: 24782d1661a5SPawel Jakub Dawidek { 2479a245a548SPawel Jakub Dawidek u_int n, ndirty, ndisks, genid, syncid; 24802d1661a5SPawel Jakub Dawidek 24812d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_provider == NULL, 24822d1661a5SPawel Jakub Dawidek ("Non-NULL provider in STARTING state (%s).", sc->sc_name)); 24832d1661a5SPawel Jakub Dawidek /* 24842d1661a5SPawel Jakub Dawidek * Are we ready? 
We are, if all disks are connected or 24852d1661a5SPawel Jakub Dawidek * one disk is missing and 'force' is true. 24862d1661a5SPawel Jakub Dawidek */ 24872d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, -1) + force == sc->sc_ndisks) { 24882d1661a5SPawel Jakub Dawidek if (!force) 24892d1661a5SPawel Jakub Dawidek callout_drain(&sc->sc_callout); 24902d1661a5SPawel Jakub Dawidek } else { 24912d1661a5SPawel Jakub Dawidek if (force) { 24922d1661a5SPawel Jakub Dawidek /* 24932d1661a5SPawel Jakub Dawidek * Timeout expired, so destroy device. 24942d1661a5SPawel Jakub Dawidek */ 24952d1661a5SPawel Jakub Dawidek sc->sc_flags |= G_RAID3_DEVICE_FLAG_DESTROY; 24964ed854e8SPawel Jakub Dawidek G_RAID3_DEBUG(1, "root_mount_rel[%u] %p", 24974ed854e8SPawel Jakub Dawidek __LINE__, sc->sc_rootmount); 24984ed854e8SPawel Jakub Dawidek root_mount_rel(sc->sc_rootmount); 24994ed854e8SPawel Jakub Dawidek sc->sc_rootmount = NULL; 25002d1661a5SPawel Jakub Dawidek } 25012d1661a5SPawel Jakub Dawidek return; 25022d1661a5SPawel Jakub Dawidek } 25032d1661a5SPawel Jakub Dawidek 25042d1661a5SPawel Jakub Dawidek /* 2505a245a548SPawel Jakub Dawidek * Find the biggest genid. 2506a245a548SPawel Jakub Dawidek */ 2507a245a548SPawel Jakub Dawidek genid = 0; 2508a245a548SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 2509a245a548SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 2510a245a548SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NODISK) 2511a245a548SPawel Jakub Dawidek continue; 2512a245a548SPawel Jakub Dawidek if (disk->d_genid > genid) 2513a245a548SPawel Jakub Dawidek genid = disk->d_genid; 2514a245a548SPawel Jakub Dawidek } 2515a245a548SPawel Jakub Dawidek sc->sc_genid = genid; 2516a245a548SPawel Jakub Dawidek /* 2517a245a548SPawel Jakub Dawidek * Remove all disks without the biggest genid. 
2518a245a548SPawel Jakub Dawidek */ 2519a245a548SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 2520a245a548SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 2521a245a548SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NODISK) 2522a245a548SPawel Jakub Dawidek continue; 2523a245a548SPawel Jakub Dawidek if (disk->d_genid < genid) { 2524a245a548SPawel Jakub Dawidek G_RAID3_DEBUG(0, 2525a245a548SPawel Jakub Dawidek "Component %s (device %s) broken, skipping.", 2526a245a548SPawel Jakub Dawidek g_raid3_get_diskname(disk), sc->sc_name); 2527a245a548SPawel Jakub Dawidek g_raid3_destroy_disk(disk); 2528a245a548SPawel Jakub Dawidek } 2529a245a548SPawel Jakub Dawidek } 2530a245a548SPawel Jakub Dawidek 2531a245a548SPawel Jakub Dawidek /* 25322d1661a5SPawel Jakub Dawidek * There must be at least 'sc->sc_ndisks - 1' components 25332d1661a5SPawel Jakub Dawidek * with the same syncid and without SYNCHRONIZING flag. 25342d1661a5SPawel Jakub Dawidek */ 25352d1661a5SPawel Jakub Dawidek 25362d1661a5SPawel Jakub Dawidek /* 25372d1661a5SPawel Jakub Dawidek * Find the biggest syncid, number of valid components and 25382d1661a5SPawel Jakub Dawidek * number of dirty components. 
25392d1661a5SPawel Jakub Dawidek */ 25402d1661a5SPawel Jakub Dawidek ndirty = ndisks = syncid = 0; 25412d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 25422d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 25432d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NODISK) 25442d1661a5SPawel Jakub Dawidek continue; 25452d1661a5SPawel Jakub Dawidek if ((disk->d_flags & G_RAID3_DISK_FLAG_DIRTY) != 0) 25462d1661a5SPawel Jakub Dawidek ndirty++; 25472d1661a5SPawel Jakub Dawidek if (disk->d_sync.ds_syncid > syncid) { 25482d1661a5SPawel Jakub Dawidek syncid = disk->d_sync.ds_syncid; 25492d1661a5SPawel Jakub Dawidek ndisks = 0; 25502d1661a5SPawel Jakub Dawidek } else if (disk->d_sync.ds_syncid < syncid) { 25512d1661a5SPawel Jakub Dawidek continue; 25522d1661a5SPawel Jakub Dawidek } 25532d1661a5SPawel Jakub Dawidek if ((disk->d_flags & 25542d1661a5SPawel Jakub Dawidek G_RAID3_DISK_FLAG_SYNCHRONIZING) != 0) { 25552d1661a5SPawel Jakub Dawidek continue; 25562d1661a5SPawel Jakub Dawidek } 25572d1661a5SPawel Jakub Dawidek ndisks++; 25582d1661a5SPawel Jakub Dawidek } 25592d1661a5SPawel Jakub Dawidek /* 25602d1661a5SPawel Jakub Dawidek * Do we have enough valid components? 25612d1661a5SPawel Jakub Dawidek */ 25622d1661a5SPawel Jakub Dawidek if (ndisks + 1 < sc->sc_ndisks) { 25632d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, 25642d1661a5SPawel Jakub Dawidek "Device %s is broken, too few valid components.", 25652d1661a5SPawel Jakub Dawidek sc->sc_name); 25662d1661a5SPawel Jakub Dawidek sc->sc_flags |= G_RAID3_DEVICE_FLAG_DESTROY; 25672d1661a5SPawel Jakub Dawidek return; 25682d1661a5SPawel Jakub Dawidek } 25692d1661a5SPawel Jakub Dawidek /* 25702d1661a5SPawel Jakub Dawidek * If there is one DIRTY component and all disks are present, 25712d1661a5SPawel Jakub Dawidek * mark it for synchronization. If there is more than one DIRTY 25722d1661a5SPawel Jakub Dawidek * component, mark parity component for synchronization. 
25732d1661a5SPawel Jakub Dawidek */ 25742d1661a5SPawel Jakub Dawidek if (ndisks == sc->sc_ndisks && ndirty == 1) { 25752d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 25762d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 25772d1661a5SPawel Jakub Dawidek if ((disk->d_flags & 25782d1661a5SPawel Jakub Dawidek G_RAID3_DISK_FLAG_DIRTY) == 0) { 25792d1661a5SPawel Jakub Dawidek continue; 25802d1661a5SPawel Jakub Dawidek } 25812d1661a5SPawel Jakub Dawidek disk->d_flags |= 25822d1661a5SPawel Jakub Dawidek G_RAID3_DISK_FLAG_SYNCHRONIZING; 25832d1661a5SPawel Jakub Dawidek } 25842d1661a5SPawel Jakub Dawidek } else if (ndisks == sc->sc_ndisks && ndirty > 1) { 25852d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[sc->sc_ndisks - 1]; 25862d1661a5SPawel Jakub Dawidek disk->d_flags |= G_RAID3_DISK_FLAG_SYNCHRONIZING; 25872d1661a5SPawel Jakub Dawidek } 25882d1661a5SPawel Jakub Dawidek 25892d1661a5SPawel Jakub Dawidek sc->sc_syncid = syncid; 25902d1661a5SPawel Jakub Dawidek if (force) { 25912d1661a5SPawel Jakub Dawidek /* Remember to bump syncid on first write. 
*/ 2592ea973705SPawel Jakub Dawidek sc->sc_bump_id |= G_RAID3_BUMP_SYNCID; 25932d1661a5SPawel Jakub Dawidek } 25942d1661a5SPawel Jakub Dawidek if (ndisks == sc->sc_ndisks) 25952d1661a5SPawel Jakub Dawidek state = G_RAID3_DEVICE_STATE_COMPLETE; 25962d1661a5SPawel Jakub Dawidek else /* if (ndisks == sc->sc_ndisks - 1) */ 25972d1661a5SPawel Jakub Dawidek state = G_RAID3_DEVICE_STATE_DEGRADED; 25982d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Device %s state changed from %s to %s.", 25992d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_device_state2str(sc->sc_state), 26002d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(state)); 26012d1661a5SPawel Jakub Dawidek sc->sc_state = state; 26022d1661a5SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 26032d1661a5SPawel Jakub Dawidek disk = &sc->sc_disks[n]; 26042d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NODISK) 26052d1661a5SPawel Jakub Dawidek continue; 26062d1661a5SPawel Jakub Dawidek state = g_raid3_determine_state(disk); 26072d1661a5SPawel Jakub Dawidek g_raid3_event_send(disk, state, G_RAID3_EVENT_DONTWAIT); 2608a245a548SPawel Jakub Dawidek if (state == G_RAID3_DISK_STATE_STALE) 2609ea973705SPawel Jakub Dawidek sc->sc_bump_id |= G_RAID3_BUMP_SYNCID; 26102d1661a5SPawel Jakub Dawidek } 26112d1661a5SPawel Jakub Dawidek break; 26122d1661a5SPawel Jakub Dawidek } 26132d1661a5SPawel Jakub Dawidek case G_RAID3_DEVICE_STATE_DEGRADED: 26142d1661a5SPawel Jakub Dawidek /* 2615ea973705SPawel Jakub Dawidek * Genid need to be bumped immediately, so do it here. 
26162d1661a5SPawel Jakub Dawidek */ 2617ea973705SPawel Jakub Dawidek if ((sc->sc_bump_id & G_RAID3_BUMP_GENID) != 0) { 2618a245a548SPawel Jakub Dawidek sc->sc_bump_id &= ~G_RAID3_BUMP_GENID; 2619a245a548SPawel Jakub Dawidek g_raid3_bump_genid(sc); 2620a245a548SPawel Jakub Dawidek } 2621a245a548SPawel Jakub Dawidek 26222d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_NEW) > 0) 26232d1661a5SPawel Jakub Dawidek return; 26242d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) < 26252d1661a5SPawel Jakub Dawidek sc->sc_ndisks - 1) { 26262d1661a5SPawel Jakub Dawidek if (sc->sc_provider != NULL) 26272d1661a5SPawel Jakub Dawidek g_raid3_destroy_provider(sc); 26282d1661a5SPawel Jakub Dawidek sc->sc_flags |= G_RAID3_DEVICE_FLAG_DESTROY; 26292d1661a5SPawel Jakub Dawidek return; 26302d1661a5SPawel Jakub Dawidek } 26312d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) == 26322d1661a5SPawel Jakub Dawidek sc->sc_ndisks) { 26332d1661a5SPawel Jakub Dawidek state = G_RAID3_DEVICE_STATE_COMPLETE; 26342d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 26352d1661a5SPawel Jakub Dawidek "Device %s state changed from %s to %s.", 26362d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_device_state2str(sc->sc_state), 26372d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(state)); 26382d1661a5SPawel Jakub Dawidek sc->sc_state = state; 26392d1661a5SPawel Jakub Dawidek } 26402d1661a5SPawel Jakub Dawidek if (sc->sc_provider == NULL) 26412d1661a5SPawel Jakub Dawidek g_raid3_launch_provider(sc); 26424ed854e8SPawel Jakub Dawidek if (sc->sc_rootmount != NULL) { 26434ed854e8SPawel Jakub Dawidek G_RAID3_DEBUG(1, "root_mount_rel[%u] %p", __LINE__, 26444ed854e8SPawel Jakub Dawidek sc->sc_rootmount); 26454ed854e8SPawel Jakub Dawidek root_mount_rel(sc->sc_rootmount); 26464ed854e8SPawel Jakub Dawidek sc->sc_rootmount = NULL; 26474ed854e8SPawel Jakub Dawidek } 26482d1661a5SPawel Jakub Dawidek break; 26492d1661a5SPawel Jakub Dawidek case 
G_RAID3_DEVICE_STATE_COMPLETE: 26502d1661a5SPawel Jakub Dawidek /* 2651ea973705SPawel Jakub Dawidek * Genid need to be bumped immediately, so do it here. 26522d1661a5SPawel Jakub Dawidek */ 2653ea973705SPawel Jakub Dawidek if ((sc->sc_bump_id & G_RAID3_BUMP_GENID) != 0) { 2654a245a548SPawel Jakub Dawidek sc->sc_bump_id &= ~G_RAID3_BUMP_GENID; 2655a245a548SPawel Jakub Dawidek g_raid3_bump_genid(sc); 2656a245a548SPawel Jakub Dawidek } 2657a245a548SPawel Jakub Dawidek 26582d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_NEW) > 0) 26592d1661a5SPawel Jakub Dawidek return; 26602d1661a5SPawel Jakub Dawidek KASSERT(g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) >= 26612d1661a5SPawel Jakub Dawidek sc->sc_ndisks - 1, 26622d1661a5SPawel Jakub Dawidek ("Too few ACTIVE components in COMPLETE state (device %s).", 26632d1661a5SPawel Jakub Dawidek sc->sc_name)); 26642d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) == 26652d1661a5SPawel Jakub Dawidek sc->sc_ndisks - 1) { 26662d1661a5SPawel Jakub Dawidek state = G_RAID3_DEVICE_STATE_DEGRADED; 26672d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 26682d1661a5SPawel Jakub Dawidek "Device %s state changed from %s to %s.", 26692d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_device_state2str(sc->sc_state), 26702d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(state)); 26712d1661a5SPawel Jakub Dawidek sc->sc_state = state; 26722d1661a5SPawel Jakub Dawidek } 26732d1661a5SPawel Jakub Dawidek if (sc->sc_provider == NULL) 26742d1661a5SPawel Jakub Dawidek g_raid3_launch_provider(sc); 26754ed854e8SPawel Jakub Dawidek if (sc->sc_rootmount != NULL) { 26764ed854e8SPawel Jakub Dawidek G_RAID3_DEBUG(1, "root_mount_rel[%u] %p", __LINE__, 26774ed854e8SPawel Jakub Dawidek sc->sc_rootmount); 26784ed854e8SPawel Jakub Dawidek root_mount_rel(sc->sc_rootmount); 26794ed854e8SPawel Jakub Dawidek sc->sc_rootmount = NULL; 26804ed854e8SPawel Jakub Dawidek } 26812d1661a5SPawel Jakub Dawidek break; 
26822d1661a5SPawel Jakub Dawidek default: 26832d1661a5SPawel Jakub Dawidek KASSERT(1 == 0, ("Wrong device state (%s, %s).", sc->sc_name, 26842d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state))); 26852d1661a5SPawel Jakub Dawidek break; 26862d1661a5SPawel Jakub Dawidek } 26872d1661a5SPawel Jakub Dawidek } 26882d1661a5SPawel Jakub Dawidek 26892d1661a5SPawel Jakub Dawidek /* 26902d1661a5SPawel Jakub Dawidek * Update disk state and device state if needed. 26912d1661a5SPawel Jakub Dawidek */ 26922d1661a5SPawel Jakub Dawidek #define DISK_STATE_CHANGED() G_RAID3_DEBUG(1, \ 26932d1661a5SPawel Jakub Dawidek "Disk %s state changed from %s to %s (device %s).", \ 26942d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), \ 26952d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state), \ 26962d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(state), sc->sc_name) 26972d1661a5SPawel Jakub Dawidek static int 2698d97d5ee9SPawel Jakub Dawidek g_raid3_update_disk(struct g_raid3_disk *disk, u_int state) 26992d1661a5SPawel Jakub Dawidek { 27002d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 27012d1661a5SPawel Jakub Dawidek 27022d1661a5SPawel Jakub Dawidek sc = disk->d_softc; 27033650be51SPawel Jakub Dawidek sx_assert(&sc->sc_lock, SX_XLOCKED); 27043650be51SPawel Jakub Dawidek 27052d1661a5SPawel Jakub Dawidek again: 27062d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(3, "Changing disk %s state from %s to %s.", 27072d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), g_raid3_disk_state2str(disk->d_state), 27082d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(state)); 27092d1661a5SPawel Jakub Dawidek switch (state) { 27102d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_NEW: 27112d1661a5SPawel Jakub Dawidek /* 27122d1661a5SPawel Jakub Dawidek * Possible scenarios: 27132d1661a5SPawel Jakub Dawidek * 1. New disk arrive. 27142d1661a5SPawel Jakub Dawidek */ 27152d1661a5SPawel Jakub Dawidek /* Previous state should be NONE. 
*/ 27162d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_NONE, 27172d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", g_raid3_get_diskname(disk), 27182d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 27192d1661a5SPawel Jakub Dawidek DISK_STATE_CHANGED(); 27202d1661a5SPawel Jakub Dawidek 27212d1661a5SPawel Jakub Dawidek disk->d_state = state; 27220cca572eSJohn-Mark Gurney G_RAID3_DEBUG(1, "Device %s: provider %s detected.", 27232d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk)); 27242d1661a5SPawel Jakub Dawidek if (sc->sc_state == G_RAID3_DEVICE_STATE_STARTING) 27252d1661a5SPawel Jakub Dawidek break; 27262d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 27272d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE, 27282d1661a5SPawel Jakub Dawidek ("Wrong device state (%s, %s, %s, %s).", sc->sc_name, 27292d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 27302d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 27312d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 27322d1661a5SPawel Jakub Dawidek state = g_raid3_determine_state(disk); 27332d1661a5SPawel Jakub Dawidek if (state != G_RAID3_DISK_STATE_NONE) 27342d1661a5SPawel Jakub Dawidek goto again; 27352d1661a5SPawel Jakub Dawidek break; 27362d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_ACTIVE: 27372d1661a5SPawel Jakub Dawidek /* 27382d1661a5SPawel Jakub Dawidek * Possible scenarios: 27392d1661a5SPawel Jakub Dawidek * 1. New disk does not need synchronization. 27402d1661a5SPawel Jakub Dawidek * 2. Synchronization process finished successfully. 
27412d1661a5SPawel Jakub Dawidek */ 27422d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 27432d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE, 27442d1661a5SPawel Jakub Dawidek ("Wrong device state (%s, %s, %s, %s).", sc->sc_name, 27452d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 27462d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 27472d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 27482d1661a5SPawel Jakub Dawidek /* Previous state should be NEW or SYNCHRONIZING. */ 27492d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_NEW || 27502d1661a5SPawel Jakub Dawidek disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING, 27512d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", g_raid3_get_diskname(disk), 27522d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 27532d1661a5SPawel Jakub Dawidek DISK_STATE_CHANGED(); 27542d1661a5SPawel Jakub Dawidek 2755bf31327cSPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING) { 27562d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_SYNCHRONIZING; 27572d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_FORCE_SYNC; 27582d1661a5SPawel Jakub Dawidek g_raid3_sync_stop(sc, 0); 27592d1661a5SPawel Jakub Dawidek } 27602d1661a5SPawel Jakub Dawidek disk->d_state = state; 27612d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset = 0; 27622d1661a5SPawel Jakub Dawidek disk->d_sync.ds_offset_done = 0; 27630962f942SPawel Jakub Dawidek g_raid3_update_idle(sc, disk); 2764bf31327cSPawel Jakub Dawidek g_raid3_update_metadata(disk); 27650cca572eSJohn-Mark Gurney G_RAID3_DEBUG(1, "Device %s: provider %s activated.", 27662d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk)); 27672d1661a5SPawel Jakub Dawidek break; 27682d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_STALE: 27692d1661a5SPawel Jakub Dawidek /* 27702d1661a5SPawel Jakub 
Dawidek * Possible scenarios: 27712d1661a5SPawel Jakub Dawidek * 1. Stale disk was connected. 27722d1661a5SPawel Jakub Dawidek */ 27732d1661a5SPawel Jakub Dawidek /* Previous state should be NEW. */ 27742d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_NEW, 27752d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", g_raid3_get_diskname(disk), 27762d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 27772d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 27782d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE, 27792d1661a5SPawel Jakub Dawidek ("Wrong device state (%s, %s, %s, %s).", sc->sc_name, 27802d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 27812d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 27822d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 27832d1661a5SPawel Jakub Dawidek /* 27842d1661a5SPawel Jakub Dawidek * STALE state is only possible if device is marked 27852d1661a5SPawel Jakub Dawidek * NOAUTOSYNC. 
27862d1661a5SPawel Jakub Dawidek */ 27872d1661a5SPawel Jakub Dawidek KASSERT((sc->sc_flags & G_RAID3_DEVICE_FLAG_NOAUTOSYNC) != 0, 27882d1661a5SPawel Jakub Dawidek ("Wrong device state (%s, %s, %s, %s).", sc->sc_name, 27892d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 27902d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 27912d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 27922d1661a5SPawel Jakub Dawidek DISK_STATE_CHANGED(); 27932d1661a5SPawel Jakub Dawidek 27942d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 27952d1661a5SPawel Jakub Dawidek disk->d_state = state; 27962d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(disk); 27972d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: provider %s is stale.", 27982d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk)); 27992d1661a5SPawel Jakub Dawidek break; 28002d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_SYNCHRONIZING: 28012d1661a5SPawel Jakub Dawidek /* 28022d1661a5SPawel Jakub Dawidek * Possible scenarios: 28032d1661a5SPawel Jakub Dawidek * 1. Disk which needs synchronization was connected. 28042d1661a5SPawel Jakub Dawidek */ 28052d1661a5SPawel Jakub Dawidek /* Previous state should be NEW. 
*/ 28062d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_NEW, 28072d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", g_raid3_get_diskname(disk), 28082d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 28092d1661a5SPawel Jakub Dawidek KASSERT(sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 28102d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE, 28112d1661a5SPawel Jakub Dawidek ("Wrong device state (%s, %s, %s, %s).", sc->sc_name, 28122d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 28132d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 28142d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 28152d1661a5SPawel Jakub Dawidek DISK_STATE_CHANGED(); 28162d1661a5SPawel Jakub Dawidek 28172d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_NEW) 28182d1661a5SPawel Jakub Dawidek disk->d_flags &= ~G_RAID3_DISK_FLAG_DIRTY; 28192d1661a5SPawel Jakub Dawidek disk->d_state = state; 28202d1661a5SPawel Jakub Dawidek if (sc->sc_provider != NULL) { 28212d1661a5SPawel Jakub Dawidek g_raid3_sync_start(sc); 28222d1661a5SPawel Jakub Dawidek g_raid3_update_metadata(disk); 28232d1661a5SPawel Jakub Dawidek } 28242d1661a5SPawel Jakub Dawidek break; 28252d1661a5SPawel Jakub Dawidek case G_RAID3_DISK_STATE_DISCONNECTED: 28262d1661a5SPawel Jakub Dawidek /* 28272d1661a5SPawel Jakub Dawidek * Possible scenarios: 28282d1661a5SPawel Jakub Dawidek * 1. Device wasn't running yet, but disk disappear. 28292d1661a5SPawel Jakub Dawidek * 2. Disk was active and disapppear. 28302d1661a5SPawel Jakub Dawidek * 3. Disk disappear during synchronization process. 
28312d1661a5SPawel Jakub Dawidek */ 28322d1661a5SPawel Jakub Dawidek if (sc->sc_state == G_RAID3_DEVICE_STATE_DEGRADED || 28332d1661a5SPawel Jakub Dawidek sc->sc_state == G_RAID3_DEVICE_STATE_COMPLETE) { 28342d1661a5SPawel Jakub Dawidek /* 28352d1661a5SPawel Jakub Dawidek * Previous state should be ACTIVE, STALE or 28362d1661a5SPawel Jakub Dawidek * SYNCHRONIZING. 28372d1661a5SPawel Jakub Dawidek */ 28382d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_ACTIVE || 28392d1661a5SPawel Jakub Dawidek disk->d_state == G_RAID3_DISK_STATE_STALE || 28402d1661a5SPawel Jakub Dawidek disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING, 28412d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", 28422d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 28432d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 28442d1661a5SPawel Jakub Dawidek } else if (sc->sc_state == G_RAID3_DEVICE_STATE_STARTING) { 28452d1661a5SPawel Jakub Dawidek /* Previous state should be NEW. */ 28462d1661a5SPawel Jakub Dawidek KASSERT(disk->d_state == G_RAID3_DISK_STATE_NEW, 28472d1661a5SPawel Jakub Dawidek ("Wrong disk state (%s, %s).", 28482d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 28492d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 28502d1661a5SPawel Jakub Dawidek /* 28512d1661a5SPawel Jakub Dawidek * Reset bumping syncid if disk disappeared in STARTING 28522d1661a5SPawel Jakub Dawidek * state. 
28532d1661a5SPawel Jakub Dawidek */ 2854ea973705SPawel Jakub Dawidek if ((sc->sc_bump_id & G_RAID3_BUMP_SYNCID) != 0) 2855a245a548SPawel Jakub Dawidek sc->sc_bump_id &= ~G_RAID3_BUMP_SYNCID; 28562d1661a5SPawel Jakub Dawidek #ifdef INVARIANTS 28572d1661a5SPawel Jakub Dawidek } else { 28582d1661a5SPawel Jakub Dawidek KASSERT(1 == 0, ("Wrong device state (%s, %s, %s, %s).", 28592d1661a5SPawel Jakub Dawidek sc->sc_name, 28602d1661a5SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state), 28612d1661a5SPawel Jakub Dawidek g_raid3_get_diskname(disk), 28622d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state))); 28632d1661a5SPawel Jakub Dawidek #endif 28642d1661a5SPawel Jakub Dawidek } 28652d1661a5SPawel Jakub Dawidek DISK_STATE_CHANGED(); 28662d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s: provider %s disconnected.", 28672d1661a5SPawel Jakub Dawidek sc->sc_name, g_raid3_get_diskname(disk)); 28682d1661a5SPawel Jakub Dawidek 28692d1661a5SPawel Jakub Dawidek g_raid3_destroy_disk(disk); 28702d1661a5SPawel Jakub Dawidek break; 28712d1661a5SPawel Jakub Dawidek default: 28722d1661a5SPawel Jakub Dawidek KASSERT(1 == 0, ("Unknown state (%u).", state)); 28732d1661a5SPawel Jakub Dawidek break; 28742d1661a5SPawel Jakub Dawidek } 28752d1661a5SPawel Jakub Dawidek return (0); 28762d1661a5SPawel Jakub Dawidek } 28772d1661a5SPawel Jakub Dawidek #undef DISK_STATE_CHANGED 28782d1661a5SPawel Jakub Dawidek 2879ea973705SPawel Jakub Dawidek int 28802d1661a5SPawel Jakub Dawidek g_raid3_read_metadata(struct g_consumer *cp, struct g_raid3_metadata *md) 28812d1661a5SPawel Jakub Dawidek { 28822d1661a5SPawel Jakub Dawidek struct g_provider *pp; 28832d1661a5SPawel Jakub Dawidek u_char *buf; 28842d1661a5SPawel Jakub Dawidek int error; 28852d1661a5SPawel Jakub Dawidek 28862d1661a5SPawel Jakub Dawidek g_topology_assert(); 28872d1661a5SPawel Jakub Dawidek 28882d1661a5SPawel Jakub Dawidek error = g_access(cp, 1, 0, 0); 28892d1661a5SPawel Jakub Dawidek if (error != 0) 
28902d1661a5SPawel Jakub Dawidek return (error); 28912d1661a5SPawel Jakub Dawidek pp = cp->provider; 28922d1661a5SPawel Jakub Dawidek g_topology_unlock(); 28932d1661a5SPawel Jakub Dawidek /* Metadata are stored on last sector. */ 28942d1661a5SPawel Jakub Dawidek buf = g_read_data(cp, pp->mediasize - pp->sectorsize, pp->sectorsize, 28952d1661a5SPawel Jakub Dawidek &error); 28962d1661a5SPawel Jakub Dawidek g_topology_lock(); 28972d1661a5SPawel Jakub Dawidek g_access(cp, -1, 0, 0); 28988a4a44b5SMaxim Sobolev if (buf == NULL) { 2899a245a548SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Cannot read metadata from %s (error=%d).", 2900a245a548SPawel Jakub Dawidek cp->provider->name, error); 29012d1661a5SPawel Jakub Dawidek return (error); 29022d1661a5SPawel Jakub Dawidek } 29032d1661a5SPawel Jakub Dawidek 29042d1661a5SPawel Jakub Dawidek /* Decode metadata. */ 29052d1661a5SPawel Jakub Dawidek error = raid3_metadata_decode(buf, md); 29062d1661a5SPawel Jakub Dawidek g_free(buf); 29072d1661a5SPawel Jakub Dawidek if (strcmp(md->md_magic, G_RAID3_MAGIC) != 0) 29082d1661a5SPawel Jakub Dawidek return (EINVAL); 2909a245a548SPawel Jakub Dawidek if (md->md_version > G_RAID3_VERSION) { 2910a245a548SPawel Jakub Dawidek G_RAID3_DEBUG(0, 2911a245a548SPawel Jakub Dawidek "Kernel module is too old to handle metadata from %s.", 2912a245a548SPawel Jakub Dawidek cp->provider->name); 2913a245a548SPawel Jakub Dawidek return (EINVAL); 2914a245a548SPawel Jakub Dawidek } 29152d1661a5SPawel Jakub Dawidek if (error != 0) { 29162d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "MD5 metadata hash mismatch for provider %s.", 29172d1661a5SPawel Jakub Dawidek cp->provider->name); 29182d1661a5SPawel Jakub Dawidek return (error); 29192d1661a5SPawel Jakub Dawidek } 292095959703SAndrey V. Elsukov if (md->md_sectorsize > MAXPHYS) { 292195959703SAndrey V. Elsukov G_RAID3_DEBUG(0, "The blocksize is too big."); 292295959703SAndrey V. Elsukov return (EINVAL); 292395959703SAndrey V. 
Elsukov } 29242d1661a5SPawel Jakub Dawidek 29252d1661a5SPawel Jakub Dawidek return (0); 29262d1661a5SPawel Jakub Dawidek } 29272d1661a5SPawel Jakub Dawidek 29282d1661a5SPawel Jakub Dawidek static int 29292d1661a5SPawel Jakub Dawidek g_raid3_check_metadata(struct g_raid3_softc *sc, struct g_provider *pp, 29302d1661a5SPawel Jakub Dawidek struct g_raid3_metadata *md) 29312d1661a5SPawel Jakub Dawidek { 29322d1661a5SPawel Jakub Dawidek 29332d1661a5SPawel Jakub Dawidek if (md->md_no >= sc->sc_ndisks) { 29342d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Invalid disk %s number (no=%u), skipping.", 29352d1661a5SPawel Jakub Dawidek pp->name, md->md_no); 29362d1661a5SPawel Jakub Dawidek return (EINVAL); 29372d1661a5SPawel Jakub Dawidek } 29382d1661a5SPawel Jakub Dawidek if (sc->sc_disks[md->md_no].d_state != G_RAID3_DISK_STATE_NODISK) { 29392d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Disk %s (no=%u) already exists, skipping.", 29402d1661a5SPawel Jakub Dawidek pp->name, md->md_no); 29412d1661a5SPawel Jakub Dawidek return (EEXIST); 29422d1661a5SPawel Jakub Dawidek } 29432d1661a5SPawel Jakub Dawidek if (md->md_all != sc->sc_ndisks) { 29442d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 29452d1661a5SPawel Jakub Dawidek "Invalid '%s' field on disk %s (device %s), skipping.", 29462d1661a5SPawel Jakub Dawidek "md_all", pp->name, sc->sc_name); 29472d1661a5SPawel Jakub Dawidek return (EINVAL); 29482d1661a5SPawel Jakub Dawidek } 294911b2174fSPawel Jakub Dawidek if ((md->md_mediasize % md->md_sectorsize) != 0) { 295011b2174fSPawel Jakub Dawidek G_RAID3_DEBUG(1, "Invalid metadata (mediasize %% sectorsize != " 295111b2174fSPawel Jakub Dawidek "0) on disk %s (device %s), skipping.", pp->name, 295211b2174fSPawel Jakub Dawidek sc->sc_name); 295311b2174fSPawel Jakub Dawidek return (EINVAL); 295411b2174fSPawel Jakub Dawidek } 29552d1661a5SPawel Jakub Dawidek if (md->md_mediasize != sc->sc_mediasize) { 29562d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 29572d1661a5SPawel Jakub Dawidek "Invalid 
'%s' field on disk %s (device %s), skipping.", 29582d1661a5SPawel Jakub Dawidek "md_mediasize", pp->name, sc->sc_name); 29592d1661a5SPawel Jakub Dawidek return (EINVAL); 29602d1661a5SPawel Jakub Dawidek } 29612d1661a5SPawel Jakub Dawidek if ((md->md_mediasize % (sc->sc_ndisks - 1)) != 0) { 29622d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 29632d1661a5SPawel Jakub Dawidek "Invalid '%s' field on disk %s (device %s), skipping.", 29642d1661a5SPawel Jakub Dawidek "md_mediasize", pp->name, sc->sc_name); 29652d1661a5SPawel Jakub Dawidek return (EINVAL); 29662d1661a5SPawel Jakub Dawidek } 29672d1661a5SPawel Jakub Dawidek if ((sc->sc_mediasize / (sc->sc_ndisks - 1)) > pp->mediasize) { 29682d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 29692d1661a5SPawel Jakub Dawidek "Invalid size of disk %s (device %s), skipping.", pp->name, 29702d1661a5SPawel Jakub Dawidek sc->sc_name); 29712d1661a5SPawel Jakub Dawidek return (EINVAL); 29722d1661a5SPawel Jakub Dawidek } 29732d1661a5SPawel Jakub Dawidek if ((md->md_sectorsize / pp->sectorsize) < sc->sc_ndisks - 1) { 29742d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 29752d1661a5SPawel Jakub Dawidek "Invalid '%s' field on disk %s (device %s), skipping.", 29762d1661a5SPawel Jakub Dawidek "md_sectorsize", pp->name, sc->sc_name); 29772d1661a5SPawel Jakub Dawidek return (EINVAL); 29782d1661a5SPawel Jakub Dawidek } 29792d1661a5SPawel Jakub Dawidek if (md->md_sectorsize != sc->sc_sectorsize) { 29802d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 29812d1661a5SPawel Jakub Dawidek "Invalid '%s' field on disk %s (device %s), skipping.", 29822d1661a5SPawel Jakub Dawidek "md_sectorsize", pp->name, sc->sc_name); 29832d1661a5SPawel Jakub Dawidek return (EINVAL); 29842d1661a5SPawel Jakub Dawidek } 29852d1661a5SPawel Jakub Dawidek if ((sc->sc_sectorsize % pp->sectorsize) != 0) { 29862d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 29872d1661a5SPawel Jakub Dawidek "Invalid sector size of disk %s (device %s), skipping.", 29882d1661a5SPawel Jakub Dawidek pp->name, 
sc->sc_name); 29892d1661a5SPawel Jakub Dawidek return (EINVAL); 29902d1661a5SPawel Jakub Dawidek } 29912d1661a5SPawel Jakub Dawidek if ((md->md_mflags & ~G_RAID3_DEVICE_FLAG_MASK) != 0) { 29922d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 29932d1661a5SPawel Jakub Dawidek "Invalid device flags on disk %s (device %s), skipping.", 29942d1661a5SPawel Jakub Dawidek pp->name, sc->sc_name); 29952d1661a5SPawel Jakub Dawidek return (EINVAL); 29962d1661a5SPawel Jakub Dawidek } 2997dba915cfSPawel Jakub Dawidek if ((md->md_mflags & G_RAID3_DEVICE_FLAG_VERIFY) != 0 && 2998dba915cfSPawel Jakub Dawidek (md->md_mflags & G_RAID3_DEVICE_FLAG_ROUND_ROBIN) != 0) { 2999dba915cfSPawel Jakub Dawidek /* 3000dba915cfSPawel Jakub Dawidek * VERIFY and ROUND-ROBIN options are mutally exclusive. 3001dba915cfSPawel Jakub Dawidek */ 3002dba915cfSPawel Jakub Dawidek G_RAID3_DEBUG(1, "Both VERIFY and ROUND-ROBIN flags exist on " 3003dba915cfSPawel Jakub Dawidek "disk %s (device %s), skipping.", pp->name, sc->sc_name); 3004dba915cfSPawel Jakub Dawidek return (EINVAL); 3005dba915cfSPawel Jakub Dawidek } 30062d1661a5SPawel Jakub Dawidek if ((md->md_dflags & ~G_RAID3_DISK_FLAG_MASK) != 0) { 30072d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, 30082d1661a5SPawel Jakub Dawidek "Invalid disk flags on disk %s (device %s), skipping.", 30092d1661a5SPawel Jakub Dawidek pp->name, sc->sc_name); 30102d1661a5SPawel Jakub Dawidek return (EINVAL); 30112d1661a5SPawel Jakub Dawidek } 30122d1661a5SPawel Jakub Dawidek return (0); 30132d1661a5SPawel Jakub Dawidek } 30142d1661a5SPawel Jakub Dawidek 3015ea973705SPawel Jakub Dawidek int 30162d1661a5SPawel Jakub Dawidek g_raid3_add_disk(struct g_raid3_softc *sc, struct g_provider *pp, 30172d1661a5SPawel Jakub Dawidek struct g_raid3_metadata *md) 30182d1661a5SPawel Jakub Dawidek { 30192d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 30202d1661a5SPawel Jakub Dawidek int error; 30212d1661a5SPawel Jakub Dawidek 30223650be51SPawel Jakub Dawidek g_topology_assert_not(); 
30232d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Adding disk %s.", pp->name); 30242d1661a5SPawel Jakub Dawidek 30252d1661a5SPawel Jakub Dawidek error = g_raid3_check_metadata(sc, pp, md); 30262d1661a5SPawel Jakub Dawidek if (error != 0) 30272d1661a5SPawel Jakub Dawidek return (error); 3028a245a548SPawel Jakub Dawidek if (sc->sc_state != G_RAID3_DEVICE_STATE_STARTING && 3029a245a548SPawel Jakub Dawidek md->md_genid < sc->sc_genid) { 3030a245a548SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Component %s (device %s) broken, skipping.", 3031a245a548SPawel Jakub Dawidek pp->name, sc->sc_name); 3032a245a548SPawel Jakub Dawidek return (EINVAL); 3033a245a548SPawel Jakub Dawidek } 30342d1661a5SPawel Jakub Dawidek disk = g_raid3_init_disk(sc, pp, md, &error); 30352d1661a5SPawel Jakub Dawidek if (disk == NULL) 30362d1661a5SPawel Jakub Dawidek return (error); 30372d1661a5SPawel Jakub Dawidek error = g_raid3_event_send(disk, G_RAID3_DISK_STATE_NEW, 30382d1661a5SPawel Jakub Dawidek G_RAID3_EVENT_WAIT); 3039a245a548SPawel Jakub Dawidek if (error != 0) 30402d1661a5SPawel Jakub Dawidek return (error); 3041a245a548SPawel Jakub Dawidek if (md->md_version < G_RAID3_VERSION) { 3042a245a548SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Upgrading metadata on %s (v%d->v%d).", 3043a245a548SPawel Jakub Dawidek pp->name, md->md_version, G_RAID3_VERSION); 3044a245a548SPawel Jakub Dawidek g_raid3_update_metadata(disk); 3045a245a548SPawel Jakub Dawidek } 3046a245a548SPawel Jakub Dawidek return (0); 30472d1661a5SPawel Jakub Dawidek } 30482d1661a5SPawel Jakub Dawidek 3049712fe9bdSPawel Jakub Dawidek static void 3050712fe9bdSPawel Jakub Dawidek g_raid3_destroy_delayed(void *arg, int flag) 3051712fe9bdSPawel Jakub Dawidek { 3052712fe9bdSPawel Jakub Dawidek struct g_raid3_softc *sc; 3053712fe9bdSPawel Jakub Dawidek int error; 3054712fe9bdSPawel Jakub Dawidek 3055712fe9bdSPawel Jakub Dawidek if (flag == EV_CANCEL) { 3056712fe9bdSPawel Jakub Dawidek G_RAID3_DEBUG(1, "Destroying canceled."); 3057712fe9bdSPawel 
Jakub Dawidek return; 3058712fe9bdSPawel Jakub Dawidek } 3059712fe9bdSPawel Jakub Dawidek sc = arg; 3060712fe9bdSPawel Jakub Dawidek g_topology_unlock(); 3061712fe9bdSPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 3062712fe9bdSPawel Jakub Dawidek KASSERT((sc->sc_flags & G_RAID3_DEVICE_FLAG_DESTROY) == 0, 3063712fe9bdSPawel Jakub Dawidek ("DESTROY flag set on %s.", sc->sc_name)); 3064712fe9bdSPawel Jakub Dawidek KASSERT((sc->sc_flags & G_RAID3_DEVICE_FLAG_DESTROYING) != 0, 3065712fe9bdSPawel Jakub Dawidek ("DESTROYING flag not set on %s.", sc->sc_name)); 3066712fe9bdSPawel Jakub Dawidek G_RAID3_DEBUG(0, "Destroying %s (delayed).", sc->sc_name); 3067712fe9bdSPawel Jakub Dawidek error = g_raid3_destroy(sc, G_RAID3_DESTROY_SOFT); 3068712fe9bdSPawel Jakub Dawidek if (error != 0) { 3069712fe9bdSPawel Jakub Dawidek G_RAID3_DEBUG(0, "Cannot destroy %s.", sc->sc_name); 3070712fe9bdSPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 3071712fe9bdSPawel Jakub Dawidek } 3072712fe9bdSPawel Jakub Dawidek g_topology_lock(); 3073712fe9bdSPawel Jakub Dawidek } 3074712fe9bdSPawel Jakub Dawidek 30752d1661a5SPawel Jakub Dawidek static int 30762d1661a5SPawel Jakub Dawidek g_raid3_access(struct g_provider *pp, int acr, int acw, int ace) 30772d1661a5SPawel Jakub Dawidek { 30782d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 3079712fe9bdSPawel Jakub Dawidek int dcr, dcw, dce, error = 0; 30802d1661a5SPawel Jakub Dawidek 30812d1661a5SPawel Jakub Dawidek g_topology_assert(); 30822d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Access request for %s: r%dw%de%d.", pp->name, acr, 30832d1661a5SPawel Jakub Dawidek acw, ace); 30842d1661a5SPawel Jakub Dawidek 30851f7fec3cSPawel Jakub Dawidek sc = pp->geom->softc; 30861f7fec3cSPawel Jakub Dawidek if (sc == NULL && acr <= 0 && acw <= 0 && ace <= 0) 30871f7fec3cSPawel Jakub Dawidek return (0); 30881f7fec3cSPawel Jakub Dawidek KASSERT(sc != NULL, ("NULL softc (provider=%s).", pp->name)); 30891f7fec3cSPawel Jakub Dawidek 30902d1661a5SPawel Jakub Dawidek dcr 
= pp->acr + acr; 30912d1661a5SPawel Jakub Dawidek dcw = pp->acw + acw; 30922d1661a5SPawel Jakub Dawidek dce = pp->ace + ace; 30932d1661a5SPawel Jakub Dawidek 30943650be51SPawel Jakub Dawidek g_topology_unlock(); 30953650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 3096712fe9bdSPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_DESTROY) != 0 || 30973650be51SPawel Jakub Dawidek g_raid3_ndisks(sc, G_RAID3_DISK_STATE_ACTIVE) < sc->sc_ndisks - 1) { 30983650be51SPawel Jakub Dawidek if (acr > 0 || acw > 0 || ace > 0) 30993650be51SPawel Jakub Dawidek error = ENXIO; 31003650be51SPawel Jakub Dawidek goto end; 31012d1661a5SPawel Jakub Dawidek } 3102f62c1a47SAlexander Motin if (dcw == 0) 31033650be51SPawel Jakub Dawidek g_raid3_idle(sc, dcw); 3104712fe9bdSPawel Jakub Dawidek if ((sc->sc_flags & G_RAID3_DEVICE_FLAG_DESTROYING) != 0) { 3105712fe9bdSPawel Jakub Dawidek if (acr > 0 || acw > 0 || ace > 0) { 3106712fe9bdSPawel Jakub Dawidek error = ENXIO; 3107712fe9bdSPawel Jakub Dawidek goto end; 3108712fe9bdSPawel Jakub Dawidek } 3109712fe9bdSPawel Jakub Dawidek if (dcr == 0 && dcw == 0 && dce == 0) { 3110712fe9bdSPawel Jakub Dawidek g_post_event(g_raid3_destroy_delayed, sc, M_WAITOK, 3111712fe9bdSPawel Jakub Dawidek sc, NULL); 3112712fe9bdSPawel Jakub Dawidek } 3113712fe9bdSPawel Jakub Dawidek } 31143650be51SPawel Jakub Dawidek end: 31153650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 31163650be51SPawel Jakub Dawidek g_topology_lock(); 31173650be51SPawel Jakub Dawidek return (error); 31182d1661a5SPawel Jakub Dawidek } 31192d1661a5SPawel Jakub Dawidek 31202d1661a5SPawel Jakub Dawidek static struct g_geom * 31212d1661a5SPawel Jakub Dawidek g_raid3_create(struct g_class *mp, const struct g_raid3_metadata *md) 31222d1661a5SPawel Jakub Dawidek { 31232d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 31242d1661a5SPawel Jakub Dawidek struct g_geom *gp; 31252d1661a5SPawel Jakub Dawidek int error, timeout; 31262d1661a5SPawel Jakub Dawidek u_int n; 31272d1661a5SPawel 
Jakub Dawidek 31282d1661a5SPawel Jakub Dawidek g_topology_assert(); 31292d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Creating device %s (id=%u).", md->md_name, md->md_id); 31302d1661a5SPawel Jakub Dawidek 31312d1661a5SPawel Jakub Dawidek /* One disk is minimum. */ 31322d1661a5SPawel Jakub Dawidek if (md->md_all < 1) 31332d1661a5SPawel Jakub Dawidek return (NULL); 31342d1661a5SPawel Jakub Dawidek /* 31352d1661a5SPawel Jakub Dawidek * Action geom. 31362d1661a5SPawel Jakub Dawidek */ 31372d1661a5SPawel Jakub Dawidek gp = g_new_geomf(mp, "%s", md->md_name); 31382d1661a5SPawel Jakub Dawidek sc = malloc(sizeof(*sc), M_RAID3, M_WAITOK | M_ZERO); 31392d1661a5SPawel Jakub Dawidek sc->sc_disks = malloc(sizeof(struct g_raid3_disk) * md->md_all, M_RAID3, 31402d1661a5SPawel Jakub Dawidek M_WAITOK | M_ZERO); 31412d1661a5SPawel Jakub Dawidek gp->start = g_raid3_start; 31422d1661a5SPawel Jakub Dawidek gp->orphan = g_raid3_orphan; 31432d1661a5SPawel Jakub Dawidek gp->access = g_raid3_access; 31442d1661a5SPawel Jakub Dawidek gp->dumpconf = g_raid3_dumpconf; 31452d1661a5SPawel Jakub Dawidek 31462d1661a5SPawel Jakub Dawidek sc->sc_id = md->md_id; 31472d1661a5SPawel Jakub Dawidek sc->sc_mediasize = md->md_mediasize; 31482d1661a5SPawel Jakub Dawidek sc->sc_sectorsize = md->md_sectorsize; 31492d1661a5SPawel Jakub Dawidek sc->sc_ndisks = md->md_all; 3150f5a2f7feSPawel Jakub Dawidek sc->sc_round_robin = 0; 31512d1661a5SPawel Jakub Dawidek sc->sc_flags = md->md_mflags; 3152a245a548SPawel Jakub Dawidek sc->sc_bump_id = 0; 31530962f942SPawel Jakub Dawidek sc->sc_idle = 1; 315401f1f41cSPawel Jakub Dawidek sc->sc_last_write = time_uptime; 31550962f942SPawel Jakub Dawidek sc->sc_writes = 0; 3156afd05d74SPawel Jakub Dawidek for (n = 0; n < sc->sc_ndisks; n++) { 3157afd05d74SPawel Jakub Dawidek sc->sc_disks[n].d_softc = sc; 3158afd05d74SPawel Jakub Dawidek sc->sc_disks[n].d_no = n; 31592d1661a5SPawel Jakub Dawidek sc->sc_disks[n].d_state = G_RAID3_DISK_STATE_NODISK; 3160afd05d74SPawel Jakub 
Dawidek } 31613650be51SPawel Jakub Dawidek sx_init(&sc->sc_lock, "graid3:lock"); 31622d1661a5SPawel Jakub Dawidek bioq_init(&sc->sc_queue); 31632d1661a5SPawel Jakub Dawidek mtx_init(&sc->sc_queue_mtx, "graid3:queue", NULL, MTX_DEF); 31643650be51SPawel Jakub Dawidek bioq_init(&sc->sc_regular_delayed); 31653650be51SPawel Jakub Dawidek bioq_init(&sc->sc_inflight); 31663650be51SPawel Jakub Dawidek bioq_init(&sc->sc_sync_delayed); 31672d1661a5SPawel Jakub Dawidek TAILQ_INIT(&sc->sc_events); 31682d1661a5SPawel Jakub Dawidek mtx_init(&sc->sc_events_mtx, "graid3:events", NULL, MTX_DEF); 31692d1661a5SPawel Jakub Dawidek callout_init(&sc->sc_callout, CALLOUT_MPSAFE); 31702d1661a5SPawel Jakub Dawidek sc->sc_state = G_RAID3_DEVICE_STATE_STARTING; 31712d1661a5SPawel Jakub Dawidek gp->softc = sc; 31722d1661a5SPawel Jakub Dawidek sc->sc_geom = gp; 31732d1661a5SPawel Jakub Dawidek sc->sc_provider = NULL; 31742d1661a5SPawel Jakub Dawidek /* 31752d1661a5SPawel Jakub Dawidek * Synchronization geom. 31762d1661a5SPawel Jakub Dawidek */ 31772d1661a5SPawel Jakub Dawidek gp = g_new_geomf(mp, "%s.sync", md->md_name); 31782d1661a5SPawel Jakub Dawidek gp->softc = sc; 31792d1661a5SPawel Jakub Dawidek gp->orphan = g_raid3_orphan; 31802d1661a5SPawel Jakub Dawidek sc->sc_sync.ds_geom = gp; 31813650be51SPawel Jakub Dawidek 3182ed940a82SPawel Jakub Dawidek if (!g_raid3_use_malloc) { 3183ed940a82SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_64K].sz_zone = uma_zcreate("gr3:64k", 3184ed940a82SPawel Jakub Dawidek 65536, g_raid3_uma_ctor, g_raid3_uma_dtor, NULL, NULL, 3185ed940a82SPawel Jakub Dawidek UMA_ALIGN_PTR, 0); 31863650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_64K].sz_inuse = 0; 31873650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_64K].sz_max = g_raid3_n64k; 31883650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_64K].sz_requested = 31893650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_64K].sz_failed = 0; 3190ed940a82SPawel Jakub Dawidek 
sc->sc_zones[G_RAID3_ZONE_16K].sz_zone = uma_zcreate("gr3:16k", 3191ed940a82SPawel Jakub Dawidek 16384, g_raid3_uma_ctor, g_raid3_uma_dtor, NULL, NULL, 3192ed940a82SPawel Jakub Dawidek UMA_ALIGN_PTR, 0); 31933650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_16K].sz_inuse = 0; 31943650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_16K].sz_max = g_raid3_n16k; 31953650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_16K].sz_requested = 31963650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_16K].sz_failed = 0; 3197ed940a82SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_4K].sz_zone = uma_zcreate("gr3:4k", 3198ed940a82SPawel Jakub Dawidek 4096, g_raid3_uma_ctor, g_raid3_uma_dtor, NULL, NULL, 3199ed940a82SPawel Jakub Dawidek UMA_ALIGN_PTR, 0); 32003650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_4K].sz_inuse = 0; 32013650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_4K].sz_max = g_raid3_n4k; 32023650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_4K].sz_requested = 32033650be51SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_4K].sz_failed = 0; 3204ed940a82SPawel Jakub Dawidek } 32053650be51SPawel Jakub Dawidek 32063745c395SJulian Elischer error = kproc_create(g_raid3_worker, sc, &sc->sc_worker, 0, 0, 32072d1661a5SPawel Jakub Dawidek "g_raid3 %s", md->md_name); 32082d1661a5SPawel Jakub Dawidek if (error != 0) { 32092d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Cannot create kernel thread for %s.", 32102d1661a5SPawel Jakub Dawidek sc->sc_name); 3211ed940a82SPawel Jakub Dawidek if (!g_raid3_use_malloc) { 32123650be51SPawel Jakub Dawidek uma_zdestroy(sc->sc_zones[G_RAID3_ZONE_64K].sz_zone); 32133650be51SPawel Jakub Dawidek uma_zdestroy(sc->sc_zones[G_RAID3_ZONE_16K].sz_zone); 32143650be51SPawel Jakub Dawidek uma_zdestroy(sc->sc_zones[G_RAID3_ZONE_4K].sz_zone); 3215ed940a82SPawel Jakub Dawidek } 32162d1661a5SPawel Jakub Dawidek g_destroy_geom(sc->sc_sync.ds_geom); 32172d1661a5SPawel Jakub Dawidek mtx_destroy(&sc->sc_events_mtx); 32182d1661a5SPawel 
/*
 * Tear down device `sc'.
 *
 * Must be called without the topology lock and with sc->sc_lock held
 * exclusively.  `how' selects what happens when the provider is still open:
 *
 *   G_RAID3_DESTROY_SOFT     refuse with EBUSY;
 *   G_RAID3_DESTROY_DELAYED  stop a running synchronization, mark the
 *                            device DESTROYING and return EBUSY;
 *   G_RAID3_DESTROY_HARD     log the fact and destroy anyway.
 *
 * Returns ENXIO when `sc' is NULL, EBUSY as described above, and 0
 * otherwise.  When the teardown runs to completion the softc and its disk
 * array have been freed, so the caller must neither touch `sc' nor unlock
 * sc->sc_lock after a 0 return.
 */
int
g_raid3_destroy(struct g_raid3_softc *sc, int how)
{
	struct g_provider *pp;

	g_topology_assert_not();
	if (sc == NULL)
		return (ENXIO);
	sx_assert(&sc->sc_lock, SX_XLOCKED);

	pp = sc->sc_provider;
	if (pp != NULL && (pp->acr != 0 || pp->acw != 0 || pp->ace != 0)) {
		switch (how) {
		case G_RAID3_DESTROY_SOFT:
			G_RAID3_DEBUG(1,
			    "Device %s is still open (r%dw%de%d).", pp->name,
			    pp->acr, pp->acw, pp->ace);
			return (EBUSY);
		case G_RAID3_DESTROY_DELAYED:
			G_RAID3_DEBUG(1,
			    "Device %s will be destroyed on last close.",
			    pp->name);
			if (sc->sc_syncdisk != NULL)
				g_raid3_sync_stop(sc, 1);
			sc->sc_flags |= G_RAID3_DEVICE_FLAG_DESTROYING;
			return (EBUSY);
		case G_RAID3_DESTROY_HARD:
			G_RAID3_DEBUG(1, "Device %s is still open, so it "
			    "can't be definitely removed.", pp->name);
			break;
		}
	}

	/*
	 * Detach the softc from both geoms under the topology lock.  A NULL
	 * softc here presumably means another destroy already got this far;
	 * nothing more is done in that case.
	 * NOTE(review): this early return reports 0 while sc->sc_lock is
	 * still held and `sc' is not freed - confirm callers cope with that.
	 */
	g_topology_lock();
	if (sc->sc_geom->softc == NULL) {
		g_topology_unlock();
		return (0);
	}
	sc->sc_geom->softc = NULL;
	sc->sc_sync.ds_geom->softc = NULL;
	g_topology_unlock();

	sc->sc_flags |= G_RAID3_DEVICE_FLAG_DESTROY;
	sc->sc_flags |= G_RAID3_DEVICE_FLAG_WAIT;
	G_RAID3_DEBUG(4, "%s: Waking up %p.", __func__, sc);
	/* Release the device lock while waiting for the worker to go away. */
	sx_xunlock(&sc->sc_lock);
	mtx_lock(&sc->sc_queue_mtx);
	wakeup(sc);
	wakeup(&sc->sc_queue);
	mtx_unlock(&sc->sc_queue_mtx);
	G_RAID3_DEBUG(4, "%s: Sleeping %p.", __func__, &sc->sc_worker);
	/*
	 * Poll (every hz / 5 ticks at most) until sc_worker becomes NULL;
	 * presumably the worker clears it when it exits - TODO confirm.
	 */
	while (sc->sc_worker != NULL)
		tsleep(&sc->sc_worker, PRIBIO, "r3:destroy", hz / 5);
	G_RAID3_DEBUG(4, "%s: Woken up %p.", __func__, &sc->sc_worker);
	sx_xlock(&sc->sc_lock);
	g_raid3_destroy_device(sc);
	free(sc->sc_disks, M_RAID3);
	free(sc, M_RAID3);
	return (0);
}
wakeup(&sc->sc_queue); 32892d1661a5SPawel Jakub Dawidek mtx_unlock(&sc->sc_queue_mtx); 32902d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Sleeping %p.", __func__, &sc->sc_worker); 32912d1661a5SPawel Jakub Dawidek while (sc->sc_worker != NULL) 32922d1661a5SPawel Jakub Dawidek tsleep(&sc->sc_worker, PRIBIO, "r3:destroy", hz / 5); 32932d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(4, "%s: Woken up %p.", __func__, &sc->sc_worker); 32943650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 32952d1661a5SPawel Jakub Dawidek g_raid3_destroy_device(sc); 32962d1661a5SPawel Jakub Dawidek free(sc->sc_disks, M_RAID3); 32972d1661a5SPawel Jakub Dawidek free(sc, M_RAID3); 32982d1661a5SPawel Jakub Dawidek return (0); 32992d1661a5SPawel Jakub Dawidek } 33002d1661a5SPawel Jakub Dawidek 33012d1661a5SPawel Jakub Dawidek static void 33022d1661a5SPawel Jakub Dawidek g_raid3_taste_orphan(struct g_consumer *cp) 33032d1661a5SPawel Jakub Dawidek { 33042d1661a5SPawel Jakub Dawidek 33052d1661a5SPawel Jakub Dawidek KASSERT(1 == 0, ("%s called while tasting %s.", __func__, 33062d1661a5SPawel Jakub Dawidek cp->provider->name)); 33072d1661a5SPawel Jakub Dawidek } 33082d1661a5SPawel Jakub Dawidek 33092d1661a5SPawel Jakub Dawidek static struct g_geom * 33102d1661a5SPawel Jakub Dawidek g_raid3_taste(struct g_class *mp, struct g_provider *pp, int flags __unused) 33112d1661a5SPawel Jakub Dawidek { 33122d1661a5SPawel Jakub Dawidek struct g_raid3_metadata md; 33132d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 33142d1661a5SPawel Jakub Dawidek struct g_consumer *cp; 33152d1661a5SPawel Jakub Dawidek struct g_geom *gp; 33162d1661a5SPawel Jakub Dawidek int error; 33172d1661a5SPawel Jakub Dawidek 33182d1661a5SPawel Jakub Dawidek g_topology_assert(); 33192d1661a5SPawel Jakub Dawidek g_trace(G_T_TOPOLOGY, "%s(%s, %s)", __func__, mp->name, pp->name); 33202d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(2, "Tasting %s.", pp->name); 33212d1661a5SPawel Jakub Dawidek 33222d1661a5SPawel Jakub Dawidek gp = 
g_new_geomf(mp, "raid3:taste"); 33232d1661a5SPawel Jakub Dawidek /* This orphan function should be never called. */ 33242d1661a5SPawel Jakub Dawidek gp->orphan = g_raid3_taste_orphan; 33252d1661a5SPawel Jakub Dawidek cp = g_new_consumer(gp); 33262d1661a5SPawel Jakub Dawidek g_attach(cp, pp); 33272d1661a5SPawel Jakub Dawidek error = g_raid3_read_metadata(cp, &md); 33282d1661a5SPawel Jakub Dawidek g_detach(cp); 33292d1661a5SPawel Jakub Dawidek g_destroy_consumer(cp); 33302d1661a5SPawel Jakub Dawidek g_destroy_geom(gp); 33312d1661a5SPawel Jakub Dawidek if (error != 0) 33322d1661a5SPawel Jakub Dawidek return (NULL); 33332d1661a5SPawel Jakub Dawidek gp = NULL; 33342d1661a5SPawel Jakub Dawidek 333590f2be24SAlexander Motin if (md.md_provider[0] != '\0' && 333690f2be24SAlexander Motin !g_compare_names(md.md_provider, pp->name)) 33372d1661a5SPawel Jakub Dawidek return (NULL); 3338e6890985SPawel Jakub Dawidek if (md.md_provsize != 0 && md.md_provsize != pp->mediasize) 3339e6890985SPawel Jakub Dawidek return (NULL); 33402d1661a5SPawel Jakub Dawidek if (g_raid3_debug >= 2) 33412d1661a5SPawel Jakub Dawidek raid3_metadata_dump(&md); 33422d1661a5SPawel Jakub Dawidek 33432d1661a5SPawel Jakub Dawidek /* 33442d1661a5SPawel Jakub Dawidek * Let's check if device already exists. 
33452d1661a5SPawel Jakub Dawidek */ 334645d5e85aSPawel Jakub Dawidek sc = NULL; 33472d1661a5SPawel Jakub Dawidek LIST_FOREACH(gp, &mp->geom, geom) { 33482d1661a5SPawel Jakub Dawidek sc = gp->softc; 33492d1661a5SPawel Jakub Dawidek if (sc == NULL) 33502d1661a5SPawel Jakub Dawidek continue; 33512d1661a5SPawel Jakub Dawidek if (sc->sc_sync.ds_geom == gp) 33522d1661a5SPawel Jakub Dawidek continue; 33532d1661a5SPawel Jakub Dawidek if (strcmp(md.md_name, sc->sc_name) != 0) 33542d1661a5SPawel Jakub Dawidek continue; 33552d1661a5SPawel Jakub Dawidek if (md.md_id != sc->sc_id) { 33562d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Device %s already configured.", 33572d1661a5SPawel Jakub Dawidek sc->sc_name); 33582d1661a5SPawel Jakub Dawidek return (NULL); 33592d1661a5SPawel Jakub Dawidek } 33602d1661a5SPawel Jakub Dawidek break; 33612d1661a5SPawel Jakub Dawidek } 33622d1661a5SPawel Jakub Dawidek if (gp == NULL) { 33632d1661a5SPawel Jakub Dawidek gp = g_raid3_create(mp, &md); 33642d1661a5SPawel Jakub Dawidek if (gp == NULL) { 33652d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Cannot create device %s.", 33662d1661a5SPawel Jakub Dawidek md.md_name); 33672d1661a5SPawel Jakub Dawidek return (NULL); 33682d1661a5SPawel Jakub Dawidek } 33692d1661a5SPawel Jakub Dawidek sc = gp->softc; 33702d1661a5SPawel Jakub Dawidek } 33712d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(1, "Adding disk %s to %s.", pp->name, gp->name); 33723650be51SPawel Jakub Dawidek g_topology_unlock(); 33733650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 33742d1661a5SPawel Jakub Dawidek error = g_raid3_add_disk(sc, pp, &md); 33752d1661a5SPawel Jakub Dawidek if (error != 0) { 33762d1661a5SPawel Jakub Dawidek G_RAID3_DEBUG(0, "Cannot add disk %s to %s (error=%d).", 33772d1661a5SPawel Jakub Dawidek pp->name, gp->name, error); 33782d1661a5SPawel Jakub Dawidek if (g_raid3_ndisks(sc, G_RAID3_DISK_STATE_NODISK) == 33792d1661a5SPawel Jakub Dawidek sc->sc_ndisks) { 3380712fe9bdSPawel Jakub Dawidek g_cancel_event(sc); 
33813525bb6bSPawel Jakub Dawidek g_raid3_destroy(sc, G_RAID3_DESTROY_HARD); 33823650be51SPawel Jakub Dawidek g_topology_lock(); 33832d1661a5SPawel Jakub Dawidek return (NULL); 33842d1661a5SPawel Jakub Dawidek } 33853650be51SPawel Jakub Dawidek gp = NULL; 33863650be51SPawel Jakub Dawidek } 33873650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 33883650be51SPawel Jakub Dawidek g_topology_lock(); 33892d1661a5SPawel Jakub Dawidek return (gp); 33902d1661a5SPawel Jakub Dawidek } 33912d1661a5SPawel Jakub Dawidek 33922d1661a5SPawel Jakub Dawidek static int 33932d1661a5SPawel Jakub Dawidek g_raid3_destroy_geom(struct gctl_req *req __unused, struct g_class *mp __unused, 33942d1661a5SPawel Jakub Dawidek struct g_geom *gp) 33952d1661a5SPawel Jakub Dawidek { 33963650be51SPawel Jakub Dawidek struct g_raid3_softc *sc; 33973650be51SPawel Jakub Dawidek int error; 33982d1661a5SPawel Jakub Dawidek 33993650be51SPawel Jakub Dawidek g_topology_unlock(); 34003650be51SPawel Jakub Dawidek sc = gp->softc; 34013650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 3402712fe9bdSPawel Jakub Dawidek g_cancel_event(sc); 34033525bb6bSPawel Jakub Dawidek error = g_raid3_destroy(gp->softc, G_RAID3_DESTROY_SOFT); 34043650be51SPawel Jakub Dawidek if (error != 0) 34053650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 34063650be51SPawel Jakub Dawidek g_topology_lock(); 34073650be51SPawel Jakub Dawidek return (error); 34082d1661a5SPawel Jakub Dawidek } 34092d1661a5SPawel Jakub Dawidek 34102d1661a5SPawel Jakub Dawidek static void 34112d1661a5SPawel Jakub Dawidek g_raid3_dumpconf(struct sbuf *sb, const char *indent, struct g_geom *gp, 34122d1661a5SPawel Jakub Dawidek struct g_consumer *cp, struct g_provider *pp) 34132d1661a5SPawel Jakub Dawidek { 34142d1661a5SPawel Jakub Dawidek struct g_raid3_softc *sc; 34152d1661a5SPawel Jakub Dawidek 34162d1661a5SPawel Jakub Dawidek g_topology_assert(); 34172d1661a5SPawel Jakub Dawidek 34182d1661a5SPawel Jakub Dawidek sc = gp->softc; 34192d1661a5SPawel Jakub 
Dawidek if (sc == NULL) 34202d1661a5SPawel Jakub Dawidek return; 34212d1661a5SPawel Jakub Dawidek /* Skip synchronization geom. */ 34222d1661a5SPawel Jakub Dawidek if (gp == sc->sc_sync.ds_geom) 34232d1661a5SPawel Jakub Dawidek return; 34242d1661a5SPawel Jakub Dawidek if (pp != NULL) { 34252d1661a5SPawel Jakub Dawidek /* Nothing here. */ 34262d1661a5SPawel Jakub Dawidek } else if (cp != NULL) { 34272d1661a5SPawel Jakub Dawidek struct g_raid3_disk *disk; 34282d1661a5SPawel Jakub Dawidek 34292d1661a5SPawel Jakub Dawidek disk = cp->private; 34302d1661a5SPawel Jakub Dawidek if (disk == NULL) 34312d1661a5SPawel Jakub Dawidek return; 34323650be51SPawel Jakub Dawidek g_topology_unlock(); 34333650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 34342d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Type>", indent); 34352d1661a5SPawel Jakub Dawidek if (disk->d_no == sc->sc_ndisks - 1) 34362d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "PARITY"); 34372d1661a5SPawel Jakub Dawidek else 34382d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "DATA"); 34392d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "</Type>\n"); 34402d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Number>%u</Number>\n", indent, 34412d1661a5SPawel Jakub Dawidek (u_int)disk->d_no); 34422d1661a5SPawel Jakub Dawidek if (disk->d_state == G_RAID3_DISK_STATE_SYNCHRONIZING) { 34432d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Synchronized>", indent); 34443650be51SPawel Jakub Dawidek if (disk->d_sync.ds_offset == 0) 34452d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "0%%"); 34462d1661a5SPawel Jakub Dawidek else { 34472d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%u%%", 34483650be51SPawel Jakub Dawidek (u_int)((disk->d_sync.ds_offset * 100) / 3449c0d68b6eSPawel Jakub Dawidek (sc->sc_mediasize / (sc->sc_ndisks - 1)))); 34502d1661a5SPawel Jakub Dawidek } 34512d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "</Synchronized>\n"); 34524a7f7b10SGleb Smirnoff if (disk->d_sync.ds_offset > 0) { 34534a7f7b10SGleb Smirnoff sbuf_printf(sb, 
"%s<BytesSynced>%jd" 34544a7f7b10SGleb Smirnoff "</BytesSynced>\n", indent, 34554a7f7b10SGleb Smirnoff (intmax_t)disk->d_sync.ds_offset); 34564a7f7b10SGleb Smirnoff } 34572d1661a5SPawel Jakub Dawidek } 34582d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<SyncID>%u</SyncID>\n", indent, 34592d1661a5SPawel Jakub Dawidek disk->d_sync.ds_syncid); 3460a245a548SPawel Jakub Dawidek sbuf_printf(sb, "%s<GenID>%u</GenID>\n", indent, disk->d_genid); 34612d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Flags>", indent); 34622d1661a5SPawel Jakub Dawidek if (disk->d_flags == 0) 34632d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "NONE"); 34642d1661a5SPawel Jakub Dawidek else { 34652d1661a5SPawel Jakub Dawidek int first = 1; 34662d1661a5SPawel Jakub Dawidek 34672d1661a5SPawel Jakub Dawidek #define ADD_FLAG(flag, name) do { \ 34682d1661a5SPawel Jakub Dawidek if ((disk->d_flags & (flag)) != 0) { \ 34692d1661a5SPawel Jakub Dawidek if (!first) \ 34702d1661a5SPawel Jakub Dawidek sbuf_printf(sb, ", "); \ 34712d1661a5SPawel Jakub Dawidek else \ 34722d1661a5SPawel Jakub Dawidek first = 0; \ 34732d1661a5SPawel Jakub Dawidek sbuf_printf(sb, name); \ 34742d1661a5SPawel Jakub Dawidek } \ 34752d1661a5SPawel Jakub Dawidek } while (0) 34762d1661a5SPawel Jakub Dawidek ADD_FLAG(G_RAID3_DISK_FLAG_DIRTY, "DIRTY"); 34772d1661a5SPawel Jakub Dawidek ADD_FLAG(G_RAID3_DISK_FLAG_HARDCODED, "HARDCODED"); 34782d1661a5SPawel Jakub Dawidek ADD_FLAG(G_RAID3_DISK_FLAG_SYNCHRONIZING, 34792d1661a5SPawel Jakub Dawidek "SYNCHRONIZING"); 34802d1661a5SPawel Jakub Dawidek ADD_FLAG(G_RAID3_DISK_FLAG_FORCE_SYNC, "FORCE_SYNC"); 34813aae74ecSPawel Jakub Dawidek ADD_FLAG(G_RAID3_DISK_FLAG_BROKEN, "BROKEN"); 34822d1661a5SPawel Jakub Dawidek #undef ADD_FLAG 34832d1661a5SPawel Jakub Dawidek } 34842d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "</Flags>\n"); 34852d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<State>%s</State>\n", indent, 34862d1661a5SPawel Jakub Dawidek g_raid3_disk_state2str(disk->d_state)); 34873650be51SPawel 
Jakub Dawidek sx_xunlock(&sc->sc_lock); 34883650be51SPawel Jakub Dawidek g_topology_lock(); 34892d1661a5SPawel Jakub Dawidek } else { 34903650be51SPawel Jakub Dawidek g_topology_unlock(); 34913650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 3492ed940a82SPawel Jakub Dawidek if (!g_raid3_use_malloc) { 3493ed940a82SPawel Jakub Dawidek sbuf_printf(sb, 3494ed940a82SPawel Jakub Dawidek "%s<Zone4kRequested>%u</Zone4kRequested>\n", indent, 3495ed940a82SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_4K].sz_requested); 3496ed940a82SPawel Jakub Dawidek sbuf_printf(sb, 3497ed940a82SPawel Jakub Dawidek "%s<Zone4kFailed>%u</Zone4kFailed>\n", indent, 3498ed940a82SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_4K].sz_failed); 3499ed940a82SPawel Jakub Dawidek sbuf_printf(sb, 3500ed940a82SPawel Jakub Dawidek "%s<Zone16kRequested>%u</Zone16kRequested>\n", indent, 3501ed940a82SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_16K].sz_requested); 3502ed940a82SPawel Jakub Dawidek sbuf_printf(sb, 3503ed940a82SPawel Jakub Dawidek "%s<Zone16kFailed>%u</Zone16kFailed>\n", indent, 3504ed940a82SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_16K].sz_failed); 3505ed940a82SPawel Jakub Dawidek sbuf_printf(sb, 3506ed940a82SPawel Jakub Dawidek "%s<Zone64kRequested>%u</Zone64kRequested>\n", indent, 3507ed940a82SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_64K].sz_requested); 3508ed940a82SPawel Jakub Dawidek sbuf_printf(sb, 3509ed940a82SPawel Jakub Dawidek "%s<Zone64kFailed>%u</Zone64kFailed>\n", indent, 3510ed940a82SPawel Jakub Dawidek sc->sc_zones[G_RAID3_ZONE_64K].sz_failed); 3511ed940a82SPawel Jakub Dawidek } 35122d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<ID>%u</ID>\n", indent, (u_int)sc->sc_id); 35132d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<SyncID>%u</SyncID>\n", indent, sc->sc_syncid); 3514a245a548SPawel Jakub Dawidek sbuf_printf(sb, "%s<GenID>%u</GenID>\n", indent, sc->sc_genid); 35152d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Flags>", indent); 35162d1661a5SPawel Jakub Dawidek 
if (sc->sc_flags == 0) 35172d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "NONE"); 35182d1661a5SPawel Jakub Dawidek else { 35192d1661a5SPawel Jakub Dawidek int first = 1; 35202d1661a5SPawel Jakub Dawidek 35212d1661a5SPawel Jakub Dawidek #define ADD_FLAG(flag, name) do { \ 35222d1661a5SPawel Jakub Dawidek if ((sc->sc_flags & (flag)) != 0) { \ 35232d1661a5SPawel Jakub Dawidek if (!first) \ 35242d1661a5SPawel Jakub Dawidek sbuf_printf(sb, ", "); \ 35252d1661a5SPawel Jakub Dawidek else \ 35262d1661a5SPawel Jakub Dawidek first = 0; \ 35272d1661a5SPawel Jakub Dawidek sbuf_printf(sb, name); \ 35282d1661a5SPawel Jakub Dawidek } \ 35292d1661a5SPawel Jakub Dawidek } while (0) 3530501250baSPawel Jakub Dawidek ADD_FLAG(G_RAID3_DEVICE_FLAG_NOFAILSYNC, "NOFAILSYNC"); 35312d1661a5SPawel Jakub Dawidek ADD_FLAG(G_RAID3_DEVICE_FLAG_NOAUTOSYNC, "NOAUTOSYNC"); 3532f5a2f7feSPawel Jakub Dawidek ADD_FLAG(G_RAID3_DEVICE_FLAG_ROUND_ROBIN, 3533f5a2f7feSPawel Jakub Dawidek "ROUND-ROBIN"); 3534dba915cfSPawel Jakub Dawidek ADD_FLAG(G_RAID3_DEVICE_FLAG_VERIFY, "VERIFY"); 35352d1661a5SPawel Jakub Dawidek #undef ADD_FLAG 35362d1661a5SPawel Jakub Dawidek } 35372d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "</Flags>\n"); 35382d1661a5SPawel Jakub Dawidek sbuf_printf(sb, "%s<Components>%u</Components>\n", indent, 35392d1661a5SPawel Jakub Dawidek sc->sc_ndisks); 354028b31df7SPawel Jakub Dawidek sbuf_printf(sb, "%s<State>%s</State>\n", indent, 354128b31df7SPawel Jakub Dawidek g_raid3_device_state2str(sc->sc_state)); 35423650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 35433650be51SPawel Jakub Dawidek g_topology_lock(); 35442d1661a5SPawel Jakub Dawidek } 35452d1661a5SPawel Jakub Dawidek } 35462d1661a5SPawel Jakub Dawidek 35479da3072cSPawel Jakub Dawidek static void 3548f62c1a47SAlexander Motin g_raid3_shutdown_post_sync(void *arg, int howto) 35499da3072cSPawel Jakub Dawidek { 35509da3072cSPawel Jakub Dawidek struct g_class *mp; 35519da3072cSPawel Jakub Dawidek struct g_geom *gp, *gp2; 
35523650be51SPawel Jakub Dawidek struct g_raid3_softc *sc; 3553712fe9bdSPawel Jakub Dawidek int error; 35549da3072cSPawel Jakub Dawidek 35559da3072cSPawel Jakub Dawidek mp = arg; 3556fdc3c6ceSPawel Jakub Dawidek DROP_GIANT(); 35579da3072cSPawel Jakub Dawidek g_topology_lock(); 3558f62c1a47SAlexander Motin g_raid3_shutdown = 1; 35599da3072cSPawel Jakub Dawidek LIST_FOREACH_SAFE(gp, &mp->geom, geom, gp2) { 35603650be51SPawel Jakub Dawidek if ((sc = gp->softc) == NULL) 35619da3072cSPawel Jakub Dawidek continue; 3562712fe9bdSPawel Jakub Dawidek /* Skip synchronization geom. */ 3563712fe9bdSPawel Jakub Dawidek if (gp == sc->sc_sync.ds_geom) 3564712fe9bdSPawel Jakub Dawidek continue; 35653650be51SPawel Jakub Dawidek g_topology_unlock(); 35663650be51SPawel Jakub Dawidek sx_xlock(&sc->sc_lock); 3567f62c1a47SAlexander Motin g_raid3_idle(sc, -1); 3568712fe9bdSPawel Jakub Dawidek g_cancel_event(sc); 3569712fe9bdSPawel Jakub Dawidek error = g_raid3_destroy(sc, G_RAID3_DESTROY_DELAYED); 3570712fe9bdSPawel Jakub Dawidek if (error != 0) 35713650be51SPawel Jakub Dawidek sx_xunlock(&sc->sc_lock); 35723650be51SPawel Jakub Dawidek g_topology_lock(); 35733650be51SPawel Jakub Dawidek } 35743650be51SPawel Jakub Dawidek g_topology_unlock(); 35753650be51SPawel Jakub Dawidek PICKUP_GIANT(); 35763650be51SPawel Jakub Dawidek } 35773650be51SPawel Jakub Dawidek 35783650be51SPawel Jakub Dawidek static void 35799da3072cSPawel Jakub Dawidek g_raid3_init(struct g_class *mp) 35809da3072cSPawel Jakub Dawidek { 35819da3072cSPawel Jakub Dawidek 3582f62c1a47SAlexander Motin g_raid3_post_sync = EVENTHANDLER_REGISTER(shutdown_post_sync, 3583f62c1a47SAlexander Motin g_raid3_shutdown_post_sync, mp, SHUTDOWN_PRI_FIRST); 3584f62c1a47SAlexander Motin if (g_raid3_post_sync == NULL) 35859da3072cSPawel Jakub Dawidek G_RAID3_DEBUG(0, "Warning! 
Cannot register shutdown event."); 35869da3072cSPawel Jakub Dawidek } 35879da3072cSPawel Jakub Dawidek 35889da3072cSPawel Jakub Dawidek static void 35899da3072cSPawel Jakub Dawidek g_raid3_fini(struct g_class *mp) 35909da3072cSPawel Jakub Dawidek { 35919da3072cSPawel Jakub Dawidek 3592f62c1a47SAlexander Motin if (g_raid3_post_sync != NULL) 3593f62c1a47SAlexander Motin EVENTHANDLER_DEREGISTER(shutdown_post_sync, g_raid3_post_sync); 35949da3072cSPawel Jakub Dawidek } 35959da3072cSPawel Jakub Dawidek 35962d1661a5SPawel Jakub Dawidek DECLARE_GEOM_CLASS(g_raid3_class, g_raid3); 3597