16e790746SPaolo Bonzini /* 26e790746SPaolo Bonzini * Virtio Block Device 36e790746SPaolo Bonzini * 46e790746SPaolo Bonzini * Copyright IBM, Corp. 2007 56e790746SPaolo Bonzini * 66e790746SPaolo Bonzini * Authors: 76e790746SPaolo Bonzini * Anthony Liguori <aliguori@us.ibm.com> 86e790746SPaolo Bonzini * 96e790746SPaolo Bonzini * This work is licensed under the terms of the GNU GPL, version 2. See 106e790746SPaolo Bonzini * the COPYING file in the top-level directory. 116e790746SPaolo Bonzini * 126e790746SPaolo Bonzini */ 136e790746SPaolo Bonzini 146e790746SPaolo Bonzini #include "qemu-common.h" 15827805a2SFam Zheng #include "qemu/iov.h" 166e790746SPaolo Bonzini #include "qemu/error-report.h" 176e790746SPaolo Bonzini #include "trace.h" 186e790746SPaolo Bonzini #include "hw/block/block.h" 196e790746SPaolo Bonzini #include "sysemu/blockdev.h" 206e790746SPaolo Bonzini #include "hw/virtio/virtio-blk.h" 216e790746SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 226e790746SPaolo Bonzini # include "dataplane/virtio-blk.h" 2384db52d0SStefan Hajnoczi # include "migration/migration.h" 246e790746SPaolo Bonzini #endif 256e790746SPaolo Bonzini #include "block/scsi.h" 266e790746SPaolo Bonzini #ifdef __linux__ 276e790746SPaolo Bonzini # include <scsi/sg.h> 286e790746SPaolo Bonzini #endif 296e790746SPaolo Bonzini #include "hw/virtio/virtio-bus.h" 30783d1897SRusty Russell #include "hw/virtio/virtio-access.h" 316e790746SPaolo Bonzini 32f897bf75SStefan Hajnoczi VirtIOBlockReq *virtio_blk_alloc_request(VirtIOBlock *s) 33671ec3f0SFam Zheng { 34869d66afSStefan Hajnoczi VirtIOBlockReq *req = g_slice_new(VirtIOBlockReq); 35671ec3f0SFam Zheng req->dev = s; 36869d66afSStefan Hajnoczi req->qiov.size = 0; 37869d66afSStefan Hajnoczi req->next = NULL; 38671ec3f0SFam Zheng return req; 39671ec3f0SFam Zheng } 40671ec3f0SFam Zheng 41f897bf75SStefan Hajnoczi void virtio_blk_free_request(VirtIOBlockReq *req) 42671ec3f0SFam Zheng { 43671ec3f0SFam Zheng if (req) { 44671ec3f0SFam Zheng g_slice_free(VirtIOBlockReq, req); 45671ec3f0SFam Zheng } 46671ec3f0SFam Zheng } 47671ec3f0SFam Zheng 48bf4bd461SFam Zheng static void virtio_blk_complete_request(VirtIOBlockReq *req, 49bf4bd461SFam Zheng unsigned char status) 506e790746SPaolo Bonzini { 516e790746SPaolo Bonzini VirtIOBlock *s = req->dev; 526e790746SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(s); 536e790746SPaolo Bonzini 546e790746SPaolo Bonzini trace_virtio_blk_req_complete(req, status); 556e790746SPaolo Bonzini 566e790746SPaolo Bonzini stb_p(&req->in->status, status); 57f897bf75SStefan Hajnoczi virtqueue_push(s->vq, &req->elem, req->qiov.size + sizeof(*req->in)); 586e790746SPaolo Bonzini virtio_notify(vdev, s->vq); 596e790746SPaolo Bonzini } 606e790746SPaolo Bonzini 61bf4bd461SFam Zheng static void virtio_blk_req_complete(VirtIOBlockReq *req, unsigned char status) 62bf4bd461SFam Zheng { 63bf4bd461SFam Zheng req->dev->complete_request(req, status); 64bf4bd461SFam Zheng } 65bf4bd461SFam Zheng 666e790746SPaolo Bonzini static int virtio_blk_handle_rw_error(VirtIOBlockReq *req, int error, 676e790746SPaolo Bonzini bool is_read) 686e790746SPaolo Bonzini { 696e790746SPaolo Bonzini BlockErrorAction action = bdrv_get_error_action(req->dev->bs, is_read, error); 706e790746SPaolo Bonzini VirtIOBlock *s = req->dev; 716e790746SPaolo Bonzini 72a589569fSWenchao Xia if (action == BLOCK_ERROR_ACTION_STOP) { 736e790746SPaolo Bonzini req->next = s->rq; 746e790746SPaolo Bonzini s->rq = req; 75a589569fSWenchao Xia } else if (action == BLOCK_ERROR_ACTION_REPORT) { 766e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); 776e790746SPaolo Bonzini bdrv_acct_done(s->bs, &req->acct); 78671ec3f0SFam Zheng virtio_blk_free_request(req); 796e790746SPaolo Bonzini } 806e790746SPaolo Bonzini 816e790746SPaolo Bonzini bdrv_error_action(s->bs, action, is_read, error); 82a589569fSWenchao Xia return action != BLOCK_ERROR_ACTION_IGNORE; 836e790746SPaolo Bonzini } 846e790746SPaolo Bonzini 856e790746SPaolo Bonzini static void virtio_blk_rw_complete(void *opaque, int ret) 866e790746SPaolo Bonzini { 876e790746SPaolo Bonzini VirtIOBlockReq *req = opaque; 886e790746SPaolo Bonzini 896e790746SPaolo Bonzini trace_virtio_blk_rw_complete(req, ret); 906e790746SPaolo Bonzini 916e790746SPaolo Bonzini if (ret) { 92783d1897SRusty Russell int p = virtio_ldl_p(VIRTIO_DEVICE(req->dev), &req->out.type); 93783d1897SRusty Russell bool is_read = !(p & VIRTIO_BLK_T_OUT); 946e790746SPaolo Bonzini if (virtio_blk_handle_rw_error(req, -ret, is_read)) 956e790746SPaolo Bonzini return; 966e790746SPaolo Bonzini } 976e790746SPaolo Bonzini 986e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 996e790746SPaolo Bonzini bdrv_acct_done(req->dev->bs, &req->acct); 100671ec3f0SFam Zheng virtio_blk_free_request(req); 1016e790746SPaolo Bonzini } 1026e790746SPaolo Bonzini 1036e790746SPaolo Bonzini static void virtio_blk_flush_complete(void *opaque, int ret) 1046e790746SPaolo Bonzini { 1056e790746SPaolo Bonzini VirtIOBlockReq *req = opaque; 1066e790746SPaolo Bonzini 1076e790746SPaolo Bonzini if (ret) { 1086e790746SPaolo Bonzini if (virtio_blk_handle_rw_error(req, -ret, 0)) { 1096e790746SPaolo Bonzini return; 1106e790746SPaolo Bonzini } 1116e790746SPaolo Bonzini } 1126e790746SPaolo Bonzini 1136e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 1146e790746SPaolo Bonzini bdrv_acct_done(req->dev->bs, &req->acct); 115671ec3f0SFam Zheng virtio_blk_free_request(req); 1166e790746SPaolo Bonzini } 1176e790746SPaolo Bonzini 1186e790746SPaolo Bonzini static VirtIOBlockReq *virtio_blk_get_request(VirtIOBlock *s) 1196e790746SPaolo Bonzini { 1206e790746SPaolo Bonzini VirtIOBlockReq *req = virtio_blk_alloc_request(s); 1216e790746SPaolo Bonzini 122f897bf75SStefan Hajnoczi if (!virtqueue_pop(s->vq, &req->elem)) { 123671ec3f0SFam Zheng virtio_blk_free_request(req); 1246e790746SPaolo Bonzini return NULL; 1256e790746SPaolo Bonzini } 1266e790746SPaolo Bonzini 1276e790746SPaolo Bonzini return req; 1286e790746SPaolo Bonzini } 1296e790746SPaolo Bonzini 1305a05cbeeSFam Zheng int virtio_blk_handle_scsi_req(VirtIOBlock *blk, 1315a05cbeeSFam Zheng VirtQueueElement *elem) 1326e790746SPaolo Bonzini { 1336e790746SPaolo Bonzini int status = VIRTIO_BLK_S_OK; 1345a05cbeeSFam Zheng struct virtio_scsi_inhdr *scsi = NULL; 135783d1897SRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(blk); 136783d1897SRusty Russell 1375a05cbeeSFam Zheng #ifdef __linux__ 1385a05cbeeSFam Zheng int i; 1395a05cbeeSFam Zheng struct sg_io_hdr hdr; 1405a05cbeeSFam Zheng #endif 1416e790746SPaolo Bonzini 1426e790746SPaolo Bonzini /* 1436e790746SPaolo Bonzini * We require at least one output segment each for the virtio_blk_outhdr 1446e790746SPaolo Bonzini * and the SCSI command block. 1456e790746SPaolo Bonzini * 1466e790746SPaolo Bonzini * We also at least require the virtio_blk_inhdr, the virtio_scsi_inhdr 1476e790746SPaolo Bonzini * and the sense buffer pointer in the input segments. 1486e790746SPaolo Bonzini */ 1495a05cbeeSFam Zheng if (elem->out_num < 2 || elem->in_num < 3) { 1505a05cbeeSFam Zheng status = VIRTIO_BLK_S_IOERR; 1515a05cbeeSFam Zheng goto fail; 1526e790746SPaolo Bonzini } 1536e790746SPaolo Bonzini 1546e790746SPaolo Bonzini /* 1556e790746SPaolo Bonzini * The scsi inhdr is placed in the second-to-last input segment, just 1566e790746SPaolo Bonzini * before the regular inhdr. 1576e790746SPaolo Bonzini */ 1585a05cbeeSFam Zheng scsi = (void *)elem->in_sg[elem->in_num - 2].iov_base; 1596e790746SPaolo Bonzini 1605a05cbeeSFam Zheng if (!blk->blk.scsi) { 1616e790746SPaolo Bonzini status = VIRTIO_BLK_S_UNSUPP; 1626e790746SPaolo Bonzini goto fail; 1636e790746SPaolo Bonzini } 1646e790746SPaolo Bonzini 1656e790746SPaolo Bonzini /* 1666e790746SPaolo Bonzini * No support for bidirection commands yet. 1676e790746SPaolo Bonzini */ 1685a05cbeeSFam Zheng if (elem->out_num > 2 && elem->in_num > 3) { 1696e790746SPaolo Bonzini status = VIRTIO_BLK_S_UNSUPP; 1706e790746SPaolo Bonzini goto fail; 1716e790746SPaolo Bonzini } 1726e790746SPaolo Bonzini 1736e790746SPaolo Bonzini #ifdef __linux__ 1746e790746SPaolo Bonzini memset(&hdr, 0, sizeof(struct sg_io_hdr)); 1756e790746SPaolo Bonzini hdr.interface_id = 'S'; 1765a05cbeeSFam Zheng hdr.cmd_len = elem->out_sg[1].iov_len; 1775a05cbeeSFam Zheng hdr.cmdp = elem->out_sg[1].iov_base; 1786e790746SPaolo Bonzini hdr.dxfer_len = 0; 1796e790746SPaolo Bonzini 1805a05cbeeSFam Zheng if (elem->out_num > 2) { 1816e790746SPaolo Bonzini /* 1826e790746SPaolo Bonzini * If there are more than the minimally required 2 output segments 1836e790746SPaolo Bonzini * there is write payload starting from the third iovec. 1846e790746SPaolo Bonzini */ 1856e790746SPaolo Bonzini hdr.dxfer_direction = SG_DXFER_TO_DEV; 1865a05cbeeSFam Zheng hdr.iovec_count = elem->out_num - 2; 1876e790746SPaolo Bonzini 1886e790746SPaolo Bonzini for (i = 0; i < hdr.iovec_count; i++) 1895a05cbeeSFam Zheng hdr.dxfer_len += elem->out_sg[i + 2].iov_len; 1906e790746SPaolo Bonzini 1915a05cbeeSFam Zheng hdr.dxferp = elem->out_sg + 2; 1926e790746SPaolo Bonzini 1935a05cbeeSFam Zheng } else if (elem->in_num > 3) { 1946e790746SPaolo Bonzini /* 1956e790746SPaolo Bonzini * If we have more than 3 input segments the guest wants to actually 1966e790746SPaolo Bonzini * read data. 1976e790746SPaolo Bonzini */ 1986e790746SPaolo Bonzini hdr.dxfer_direction = SG_DXFER_FROM_DEV; 1995a05cbeeSFam Zheng hdr.iovec_count = elem->in_num - 3; 2006e790746SPaolo Bonzini for (i = 0; i < hdr.iovec_count; i++) 2015a05cbeeSFam Zheng hdr.dxfer_len += elem->in_sg[i].iov_len; 2026e790746SPaolo Bonzini 2035a05cbeeSFam Zheng hdr.dxferp = elem->in_sg; 2046e790746SPaolo Bonzini } else { 2056e790746SPaolo Bonzini /* 2066e790746SPaolo Bonzini * Some SCSI commands don't actually transfer any data. 2076e790746SPaolo Bonzini */ 2086e790746SPaolo Bonzini hdr.dxfer_direction = SG_DXFER_NONE; 2096e790746SPaolo Bonzini } 2106e790746SPaolo Bonzini 2115a05cbeeSFam Zheng hdr.sbp = elem->in_sg[elem->in_num - 3].iov_base; 2125a05cbeeSFam Zheng hdr.mx_sb_len = elem->in_sg[elem->in_num - 3].iov_len; 2136e790746SPaolo Bonzini 2145a05cbeeSFam Zheng status = bdrv_ioctl(blk->bs, SG_IO, &hdr); 2155a05cbeeSFam Zheng if (status) { 2166e790746SPaolo Bonzini status = VIRTIO_BLK_S_UNSUPP; 2176e790746SPaolo Bonzini goto fail; 2186e790746SPaolo Bonzini } 2196e790746SPaolo Bonzini 2206e790746SPaolo Bonzini /* 2216e790746SPaolo Bonzini * From SCSI-Generic-HOWTO: "Some lower level drivers (e.g. ide-scsi) 2226e790746SPaolo Bonzini * clear the masked_status field [hence status gets cleared too, see 2236e790746SPaolo Bonzini * block/scsi_ioctl.c] even when a CHECK_CONDITION or COMMAND_TERMINATED 2246e790746SPaolo Bonzini * status has occurred. However they do set DRIVER_SENSE in driver_status 2256e790746SPaolo Bonzini * field. Also a (sb_len_wr > 0) indicates there is a sense buffer. 2266e790746SPaolo Bonzini */ 2276e790746SPaolo Bonzini if (hdr.status == 0 && hdr.sb_len_wr > 0) { 2286e790746SPaolo Bonzini hdr.status = CHECK_CONDITION; 2296e790746SPaolo Bonzini } 2306e790746SPaolo Bonzini 231783d1897SRusty Russell virtio_stl_p(vdev, &scsi->errors, 2326e790746SPaolo Bonzini hdr.status | (hdr.msg_status << 8) | 2336e790746SPaolo Bonzini (hdr.host_status << 16) | (hdr.driver_status << 24)); 234783d1897SRusty Russell virtio_stl_p(vdev, &scsi->residual, hdr.resid); 235783d1897SRusty Russell virtio_stl_p(vdev, &scsi->sense_len, hdr.sb_len_wr); 236783d1897SRusty Russell virtio_stl_p(vdev, &scsi->data_len, hdr.dxfer_len); 2376e790746SPaolo Bonzini 2385a05cbeeSFam Zheng return status; 2396e790746SPaolo Bonzini #else 2406e790746SPaolo Bonzini abort(); 2416e790746SPaolo Bonzini #endif 2426e790746SPaolo Bonzini 2436e790746SPaolo Bonzini fail: 2446e790746SPaolo Bonzini /* Just put anything nonzero so that the ioctl fails in the guest. */ 2455a05cbeeSFam Zheng if (scsi) { 246783d1897SRusty Russell virtio_stl_p(vdev, &scsi->errors, 255); 2475a05cbeeSFam Zheng } 2485a05cbeeSFam Zheng return status; 2495a05cbeeSFam Zheng } 2505a05cbeeSFam Zheng 2515a05cbeeSFam Zheng static void virtio_blk_handle_scsi(VirtIOBlockReq *req) 2525a05cbeeSFam Zheng { 2535a05cbeeSFam Zheng int status; 2545a05cbeeSFam Zheng 255f897bf75SStefan Hajnoczi status = virtio_blk_handle_scsi_req(req->dev, &req->elem); 2566e790746SPaolo Bonzini virtio_blk_req_complete(req, status); 257671ec3f0SFam Zheng virtio_blk_free_request(req); 2586e790746SPaolo Bonzini } 2596e790746SPaolo Bonzini 260fee65db7SFam Zheng void virtio_submit_multiwrite(BlockDriverState *bs, MultiReqBuffer *mrb) 2616e790746SPaolo Bonzini { 2626e790746SPaolo Bonzini int i, ret; 2636e790746SPaolo Bonzini 2646e790746SPaolo Bonzini if (!mrb->num_writes) { 2656e790746SPaolo Bonzini return; 2666e790746SPaolo Bonzini } 2676e790746SPaolo Bonzini 2686e790746SPaolo Bonzini ret = bdrv_aio_multiwrite(bs, mrb->blkreq, mrb->num_writes); 2696e790746SPaolo Bonzini if (ret != 0) { 2706e790746SPaolo Bonzini for (i = 0; i < mrb->num_writes; i++) { 2716e790746SPaolo Bonzini if (mrb->blkreq[i].error) { 2726e790746SPaolo Bonzini virtio_blk_rw_complete(mrb->blkreq[i].opaque, -EIO); 2736e790746SPaolo Bonzini } 2746e790746SPaolo Bonzini } 2756e790746SPaolo Bonzini } 2766e790746SPaolo Bonzini 2776e790746SPaolo Bonzini mrb->num_writes = 0; 2786e790746SPaolo Bonzini } 2796e790746SPaolo Bonzini 2806e790746SPaolo Bonzini static void virtio_blk_handle_flush(VirtIOBlockReq *req, MultiReqBuffer *mrb) 2816e790746SPaolo Bonzini { 2826e790746SPaolo Bonzini bdrv_acct_start(req->dev->bs, &req->acct, 0, BDRV_ACCT_FLUSH); 2836e790746SPaolo Bonzini 2846e790746SPaolo Bonzini /* 2856e790746SPaolo Bonzini * Make sure all outstanding writes are posted to the backing device. 2866e790746SPaolo Bonzini */ 2876e790746SPaolo Bonzini virtio_submit_multiwrite(req->dev->bs, mrb); 2886e790746SPaolo Bonzini bdrv_aio_flush(req->dev->bs, virtio_blk_flush_complete, req); 2896e790746SPaolo Bonzini } 2906e790746SPaolo Bonzini 291d0e14376SMarkus Armbruster static bool virtio_blk_sect_range_ok(VirtIOBlock *dev, 292d0e14376SMarkus Armbruster uint64_t sector, size_t size) 293d0e14376SMarkus Armbruster { 294*3c2daac0SMarkus Armbruster uint64_t nb_sectors = size >> BDRV_SECTOR_BITS; 295*3c2daac0SMarkus Armbruster uint64_t total_sectors; 296*3c2daac0SMarkus Armbruster 297d0e14376SMarkus Armbruster if (sector & dev->sector_mask) { 298d0e14376SMarkus Armbruster return false; 299d0e14376SMarkus Armbruster } 300d0e14376SMarkus Armbruster if (size % dev->conf->logical_block_size) { 301d0e14376SMarkus Armbruster return false; 302d0e14376SMarkus Armbruster } 303*3c2daac0SMarkus Armbruster bdrv_get_geometry(dev->bs, &total_sectors); 304*3c2daac0SMarkus Armbruster if (sector > total_sectors || nb_sectors > total_sectors - sector) { 305*3c2daac0SMarkus Armbruster return false; 306*3c2daac0SMarkus Armbruster } 307d0e14376SMarkus Armbruster return true; 308d0e14376SMarkus Armbruster } 309d0e14376SMarkus Armbruster 3106e790746SPaolo Bonzini static void virtio_blk_handle_write(VirtIOBlockReq *req, MultiReqBuffer *mrb) 3116e790746SPaolo Bonzini { 3126e790746SPaolo Bonzini BlockRequest *blkreq; 3136e790746SPaolo Bonzini uint64_t sector; 3146e790746SPaolo Bonzini 315783d1897SRusty Russell sector = virtio_ldq_p(VIRTIO_DEVICE(req->dev), &req->out.sector); 3166e790746SPaolo Bonzini 3176e790746SPaolo Bonzini trace_virtio_blk_handle_write(req, sector, req->qiov.size / 512); 3186e790746SPaolo Bonzini 319d0e14376SMarkus Armbruster if (!virtio_blk_sect_range_ok(req->dev, sector, req->qiov.size)) { 32042e38c1fSMarkus Armbruster virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); 32142e38c1fSMarkus Armbruster virtio_blk_free_request(req); 3226e790746SPaolo Bonzini return; 3236e790746SPaolo Bonzini } 3246e790746SPaolo Bonzini 32542e38c1fSMarkus Armbruster bdrv_acct_start(req->dev->bs, &req->acct, req->qiov.size, BDRV_ACCT_WRITE); 32642e38c1fSMarkus Armbruster 3276e790746SPaolo Bonzini if (mrb->num_writes == 32) { 3286e790746SPaolo Bonzini virtio_submit_multiwrite(req->dev->bs, mrb); 3296e790746SPaolo Bonzini } 3306e790746SPaolo Bonzini 3316e790746SPaolo Bonzini blkreq = &mrb->blkreq[mrb->num_writes]; 3326e790746SPaolo Bonzini blkreq->sector = sector; 3336e790746SPaolo Bonzini blkreq->nb_sectors = req->qiov.size / BDRV_SECTOR_SIZE; 3346e790746SPaolo Bonzini blkreq->qiov = &req->qiov; 3356e790746SPaolo Bonzini blkreq->cb = virtio_blk_rw_complete; 3366e790746SPaolo Bonzini blkreq->opaque = req; 3376e790746SPaolo Bonzini blkreq->error = 0; 3386e790746SPaolo Bonzini 3396e790746SPaolo Bonzini mrb->num_writes++; 3406e790746SPaolo Bonzini } 3416e790746SPaolo Bonzini 3426e790746SPaolo Bonzini static void virtio_blk_handle_read(VirtIOBlockReq *req) 3436e790746SPaolo Bonzini { 3446e790746SPaolo Bonzini uint64_t sector; 3456e790746SPaolo Bonzini 346783d1897SRusty Russell sector = virtio_ldq_p(VIRTIO_DEVICE(req->dev), &req->out.sector); 3476e790746SPaolo Bonzini 3486e790746SPaolo Bonzini trace_virtio_blk_handle_read(req, sector, req->qiov.size / 512); 3496e790746SPaolo Bonzini 350d0e14376SMarkus Armbruster if (!virtio_blk_sect_range_ok(req->dev, sector, req->qiov.size)) { 35142e38c1fSMarkus Armbruster virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); 35242e38c1fSMarkus Armbruster virtio_blk_free_request(req); 3536e790746SPaolo Bonzini return; 3546e790746SPaolo Bonzini } 35542e38c1fSMarkus Armbruster 35642e38c1fSMarkus Armbruster bdrv_acct_start(req->dev->bs, &req->acct, req->qiov.size, BDRV_ACCT_READ); 3576e790746SPaolo Bonzini bdrv_aio_readv(req->dev->bs, sector, &req->qiov, 3586e790746SPaolo Bonzini req->qiov.size / BDRV_SECTOR_SIZE, 3596e790746SPaolo Bonzini virtio_blk_rw_complete, req); 3606e790746SPaolo Bonzini } 3616e790746SPaolo Bonzini 362fee65db7SFam Zheng void virtio_blk_handle_request(VirtIOBlockReq *req, MultiReqBuffer *mrb) 3636e790746SPaolo Bonzini { 3646e790746SPaolo Bonzini uint32_t type; 365f897bf75SStefan Hajnoczi struct iovec *in_iov = req->elem.in_sg; 366f897bf75SStefan Hajnoczi struct iovec *iov = req->elem.out_sg; 367f897bf75SStefan Hajnoczi unsigned in_num = req->elem.in_num; 368f897bf75SStefan Hajnoczi unsigned out_num = req->elem.out_num; 3696e790746SPaolo Bonzini 370f897bf75SStefan Hajnoczi if (req->elem.out_num < 1 || req->elem.in_num < 1) { 3716e790746SPaolo Bonzini error_report("virtio-blk missing headers"); 3726e790746SPaolo Bonzini exit(1); 3736e790746SPaolo Bonzini } 3746e790746SPaolo Bonzini 375827805a2SFam Zheng if (unlikely(iov_to_buf(iov, out_num, 0, &req->out, 376827805a2SFam Zheng sizeof(req->out)) != sizeof(req->out))) { 377827805a2SFam Zheng error_report("virtio-blk request outhdr too short"); 378827805a2SFam Zheng exit(1); 379827805a2SFam Zheng } 380ee17e848SFam Zheng 381827805a2SFam Zheng iov_discard_front(&iov, &out_num, sizeof(req->out)); 382ee17e848SFam Zheng 383ee17e848SFam Zheng if (in_num < 1 || 384ee17e848SFam Zheng in_iov[in_num - 1].iov_len < sizeof(struct virtio_blk_inhdr)) { 385ee17e848SFam Zheng error_report("virtio-blk request inhdr too short"); 386ee17e848SFam Zheng exit(1); 387ee17e848SFam Zheng } 388ee17e848SFam Zheng 389ee17e848SFam Zheng req->in = (void *)in_iov[in_num - 1].iov_base 390ee17e848SFam Zheng + in_iov[in_num - 1].iov_len 391ee17e848SFam Zheng - sizeof(struct virtio_blk_inhdr); 392ee17e848SFam Zheng iov_discard_back(in_iov, &in_num, sizeof(struct virtio_blk_inhdr)); 3936e790746SPaolo Bonzini 394783d1897SRusty Russell type = virtio_ldl_p(VIRTIO_DEVICE(req->dev), &req->out.type); 3956e790746SPaolo Bonzini 3966e790746SPaolo Bonzini if (type & VIRTIO_BLK_T_FLUSH) { 3976e790746SPaolo Bonzini virtio_blk_handle_flush(req, mrb); 3986e790746SPaolo Bonzini } else if (type & VIRTIO_BLK_T_SCSI_CMD) { 3996e790746SPaolo Bonzini virtio_blk_handle_scsi(req); 4006e790746SPaolo Bonzini } else if (type & VIRTIO_BLK_T_GET_ID) { 4016e790746SPaolo Bonzini VirtIOBlock *s = req->dev; 4026e790746SPaolo Bonzini 4036e790746SPaolo Bonzini /* 4046e790746SPaolo Bonzini * NB: per existing s/n string convention the string is 4056e790746SPaolo Bonzini * terminated by '\0' only when shorter than buffer. 4066e790746SPaolo Bonzini */ 407f897bf75SStefan Hajnoczi strncpy(req->elem.in_sg[0].iov_base, 4086e790746SPaolo Bonzini s->blk.serial ? s->blk.serial : "", 409f897bf75SStefan Hajnoczi MIN(req->elem.in_sg[0].iov_len, VIRTIO_BLK_ID_BYTES)); 4106e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 411671ec3f0SFam Zheng virtio_blk_free_request(req); 4126e790746SPaolo Bonzini } else if (type & VIRTIO_BLK_T_OUT) { 413f897bf75SStefan Hajnoczi qemu_iovec_init_external(&req->qiov, &req->elem.out_sg[1], 414f897bf75SStefan Hajnoczi req->elem.out_num - 1); 4156e790746SPaolo Bonzini virtio_blk_handle_write(req, mrb); 4166e790746SPaolo Bonzini } else if (type == VIRTIO_BLK_T_IN || type == VIRTIO_BLK_T_BARRIER) { 4176e790746SPaolo Bonzini /* VIRTIO_BLK_T_IN is 0, so we can't just & it. */ 418f897bf75SStefan Hajnoczi qemu_iovec_init_external(&req->qiov, &req->elem.in_sg[0], 419f897bf75SStefan Hajnoczi req->elem.in_num - 1); 4206e790746SPaolo Bonzini virtio_blk_handle_read(req); 4216e790746SPaolo Bonzini } else { 4226e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_UNSUPP); 423671ec3f0SFam Zheng virtio_blk_free_request(req); 4246e790746SPaolo Bonzini } 4256e790746SPaolo Bonzini } 4266e790746SPaolo Bonzini 4276e790746SPaolo Bonzini static void virtio_blk_handle_output(VirtIODevice *vdev, VirtQueue *vq) 4286e790746SPaolo Bonzini { 4296e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 4306e790746SPaolo Bonzini VirtIOBlockReq *req; 4316e790746SPaolo Bonzini MultiReqBuffer mrb = { 4326e790746SPaolo Bonzini .num_writes = 0, 4336e790746SPaolo Bonzini }; 4346e790746SPaolo Bonzini 4356e790746SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 4366e790746SPaolo Bonzini /* Some guests kick before setting VIRTIO_CONFIG_S_DRIVER_OK so start 4376e790746SPaolo Bonzini * dataplane here instead of waiting for .set_status(). 4386e790746SPaolo Bonzini */ 4396e790746SPaolo Bonzini if (s->dataplane) { 4406e790746SPaolo Bonzini virtio_blk_data_plane_start(s->dataplane); 4416e790746SPaolo Bonzini return; 4426e790746SPaolo Bonzini } 4436e790746SPaolo Bonzini #endif 4446e790746SPaolo Bonzini 4456e790746SPaolo Bonzini while ((req = virtio_blk_get_request(s))) { 4466e790746SPaolo Bonzini virtio_blk_handle_request(req, &mrb); 4476e790746SPaolo Bonzini } 4486e790746SPaolo Bonzini 4496e790746SPaolo Bonzini virtio_submit_multiwrite(s->bs, &mrb); 4506e790746SPaolo Bonzini 4516e790746SPaolo Bonzini /* 4526e790746SPaolo Bonzini * FIXME: Want to check for completions before returning to guest mode, 4536e790746SPaolo Bonzini * so cached reads and writes are reported as quickly as possible. But 4546e790746SPaolo Bonzini * that should be done in the generic block layer. 4556e790746SPaolo Bonzini */ 4566e790746SPaolo Bonzini } 4576e790746SPaolo Bonzini 4586e790746SPaolo Bonzini static void virtio_blk_dma_restart_bh(void *opaque) 4596e790746SPaolo Bonzini { 4606e790746SPaolo Bonzini VirtIOBlock *s = opaque; 4616e790746SPaolo Bonzini VirtIOBlockReq *req = s->rq; 4626e790746SPaolo Bonzini MultiReqBuffer mrb = { 4636e790746SPaolo Bonzini .num_writes = 0, 4646e790746SPaolo Bonzini }; 4656e790746SPaolo Bonzini 4666e790746SPaolo Bonzini qemu_bh_delete(s->bh); 4676e790746SPaolo Bonzini s->bh = NULL; 4686e790746SPaolo Bonzini 4696e790746SPaolo Bonzini s->rq = NULL; 4706e790746SPaolo Bonzini 4716e790746SPaolo Bonzini while (req) { 4726e790746SPaolo Bonzini virtio_blk_handle_request(req, &mrb); 4736e790746SPaolo Bonzini req = req->next; 4746e790746SPaolo Bonzini } 4756e790746SPaolo Bonzini 4766e790746SPaolo Bonzini virtio_submit_multiwrite(s->bs, &mrb); 4776e790746SPaolo Bonzini } 4786e790746SPaolo Bonzini 4796e790746SPaolo Bonzini static void virtio_blk_dma_restart_cb(void *opaque, int running, 4806e790746SPaolo Bonzini RunState state) 4816e790746SPaolo Bonzini { 4826e790746SPaolo Bonzini VirtIOBlock *s = opaque; 4836e790746SPaolo Bonzini 4846e790746SPaolo Bonzini if (!running) { 4856e790746SPaolo Bonzini return; 4866e790746SPaolo Bonzini } 4876e790746SPaolo Bonzini 4886e790746SPaolo Bonzini if (!s->bh) { 4894407c1c5SFam Zheng s->bh = aio_bh_new(bdrv_get_aio_context(s->blk.conf.bs), 4904407c1c5SFam Zheng virtio_blk_dma_restart_bh, s); 4916e790746SPaolo Bonzini qemu_bh_schedule(s->bh); 4926e790746SPaolo Bonzini } 4936e790746SPaolo Bonzini } 4946e790746SPaolo Bonzini 4956e790746SPaolo Bonzini static void virtio_blk_reset(VirtIODevice *vdev) 4966e790746SPaolo Bonzini { 4976e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 4986e790746SPaolo Bonzini 499ef5bc962SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 5006e790746SPaolo Bonzini if (s->dataplane) { 5016e790746SPaolo Bonzini virtio_blk_data_plane_stop(s->dataplane); 5026e790746SPaolo Bonzini } 5036e790746SPaolo Bonzini #endif 5046e790746SPaolo Bonzini 5056e790746SPaolo Bonzini /* 5066e790746SPaolo Bonzini * This should cancel pending requests, but can't do nicely until there 5076e790746SPaolo Bonzini * are per-device request lists. 5086e790746SPaolo Bonzini */ 5096e790746SPaolo Bonzini bdrv_drain_all(); 510ef5bc962SPaolo Bonzini bdrv_set_enable_write_cache(s->bs, s->original_wce); 5116e790746SPaolo Bonzini } 5126e790746SPaolo Bonzini 5136e790746SPaolo Bonzini /* coalesce internal state, copy to pci i/o region 0 5146e790746SPaolo Bonzini */ 5156e790746SPaolo Bonzini static void virtio_blk_update_config(VirtIODevice *vdev, uint8_t *config) 5166e790746SPaolo Bonzini { 5176e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5186e790746SPaolo Bonzini struct virtio_blk_config blkcfg; 5196e790746SPaolo Bonzini uint64_t capacity; 5206e790746SPaolo Bonzini int blk_size = s->conf->logical_block_size; 5216e790746SPaolo Bonzini 5226e790746SPaolo Bonzini bdrv_get_geometry(s->bs, &capacity); 5236e790746SPaolo Bonzini memset(&blkcfg, 0, sizeof(blkcfg)); 524783d1897SRusty Russell virtio_stq_p(vdev, &blkcfg.capacity, capacity); 525783d1897SRusty Russell virtio_stl_p(vdev, &blkcfg.seg_max, 128 - 2); 526783d1897SRusty Russell virtio_stw_p(vdev, &blkcfg.cylinders, s->conf->cyls); 527783d1897SRusty Russell virtio_stl_p(vdev, &blkcfg.blk_size, blk_size); 528783d1897SRusty Russell virtio_stw_p(vdev, &blkcfg.min_io_size, s->conf->min_io_size / blk_size); 529783d1897SRusty Russell virtio_stw_p(vdev, &blkcfg.opt_io_size, s->conf->opt_io_size / blk_size); 5306e790746SPaolo Bonzini blkcfg.heads = s->conf->heads; 5316e790746SPaolo Bonzini /* 5326e790746SPaolo Bonzini * We must ensure that the block device capacity is a multiple of 533e03ba136SPeter Maydell * the logical block size. If that is not the case, let's use 5346e790746SPaolo Bonzini * sector_mask to adopt the geometry to have a correct picture. 5356e790746SPaolo Bonzini * For those devices where the capacity is ok for the given geometry 536e03ba136SPeter Maydell * we don't touch the sector value of the geometry, since some devices 5376e790746SPaolo Bonzini * (like s390 dasd) need a specific value. Here the capacity is already 5386e790746SPaolo Bonzini * cyls*heads*secs*blk_size and the sector value is not block size 5396e790746SPaolo Bonzini * divided by 512 - instead it is the amount of blk_size blocks 5406e790746SPaolo Bonzini * per track (cylinder). 5416e790746SPaolo Bonzini */ 5426e790746SPaolo Bonzini if (bdrv_getlength(s->bs) / s->conf->heads / s->conf->secs % blk_size) { 5436e790746SPaolo Bonzini blkcfg.sectors = s->conf->secs & ~s->sector_mask; 5446e790746SPaolo Bonzini } else { 5456e790746SPaolo Bonzini blkcfg.sectors = s->conf->secs; 5466e790746SPaolo Bonzini } 5476e790746SPaolo Bonzini blkcfg.size_max = 0; 5486e790746SPaolo Bonzini blkcfg.physical_block_exp = get_physical_block_exp(s->conf); 5496e790746SPaolo Bonzini blkcfg.alignment_offset = 0; 5506e790746SPaolo Bonzini blkcfg.wce = bdrv_enable_write_cache(s->bs); 5516e790746SPaolo Bonzini memcpy(config, &blkcfg, sizeof(struct virtio_blk_config)); 5526e790746SPaolo Bonzini } 5536e790746SPaolo Bonzini 5546e790746SPaolo Bonzini static void virtio_blk_set_config(VirtIODevice *vdev, const uint8_t *config) 5556e790746SPaolo Bonzini { 5566e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5576e790746SPaolo Bonzini struct virtio_blk_config blkcfg; 5586e790746SPaolo Bonzini 5596e790746SPaolo Bonzini memcpy(&blkcfg, config, sizeof(blkcfg)); 5606d7e73d6SFam Zheng 5616d7e73d6SFam Zheng aio_context_acquire(bdrv_get_aio_context(s->bs)); 5626e790746SPaolo Bonzini bdrv_set_enable_write_cache(s->bs, blkcfg.wce != 0); 5636d7e73d6SFam Zheng aio_context_release(bdrv_get_aio_context(s->bs)); 5646e790746SPaolo Bonzini } 5656e790746SPaolo Bonzini 5666e790746SPaolo Bonzini static uint32_t virtio_blk_get_features(VirtIODevice *vdev, uint32_t features) 5676e790746SPaolo Bonzini { 5686e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5696e790746SPaolo Bonzini 5706e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_SEG_MAX); 5716e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_GEOMETRY); 5726e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_TOPOLOGY); 5736e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_BLK_SIZE); 5746e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_SCSI); 5756e790746SPaolo Bonzini 5766e790746SPaolo Bonzini if (s->blk.config_wce) { 5776e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_CONFIG_WCE); 5786e790746SPaolo Bonzini } 5796e790746SPaolo Bonzini if (bdrv_enable_write_cache(s->bs)) 5806e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_WCE); 5816e790746SPaolo Bonzini 5826e790746SPaolo Bonzini if (bdrv_is_read_only(s->bs)) 5836e790746SPaolo Bonzini features |= 1 << VIRTIO_BLK_F_RO; 5846e790746SPaolo Bonzini 5856e790746SPaolo Bonzini return features; 5866e790746SPaolo Bonzini } 5876e790746SPaolo Bonzini 5886e790746SPaolo Bonzini static void virtio_blk_set_status(VirtIODevice *vdev, uint8_t status) 5896e790746SPaolo Bonzini { 5906e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5916e790746SPaolo Bonzini uint32_t features; 5926e790746SPaolo Bonzini 5936e790746SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 5946e790746SPaolo Bonzini if (s->dataplane && !(status & (VIRTIO_CONFIG_S_DRIVER | 5956e790746SPaolo Bonzini VIRTIO_CONFIG_S_DRIVER_OK))) { 5966e790746SPaolo Bonzini virtio_blk_data_plane_stop(s->dataplane); 5976e790746SPaolo Bonzini } 5986e790746SPaolo Bonzini #endif 5996e790746SPaolo Bonzini 6006e790746SPaolo Bonzini if (!(status & VIRTIO_CONFIG_S_DRIVER_OK)) { 6016e790746SPaolo Bonzini return; 6026e790746SPaolo Bonzini } 6036e790746SPaolo Bonzini 6046e790746SPaolo Bonzini features = vdev->guest_features; 605ef5bc962SPaolo Bonzini 606ef5bc962SPaolo Bonzini /* A guest that supports VIRTIO_BLK_F_CONFIG_WCE must be able to send 607ef5bc962SPaolo Bonzini * cache flushes. Thus, the "auto writethrough" behavior is never 608ef5bc962SPaolo Bonzini * necessary for guests that support the VIRTIO_BLK_F_CONFIG_WCE feature. 609ef5bc962SPaolo Bonzini * Leaving it enabled would break the following sequence: 610ef5bc962SPaolo Bonzini * 611ef5bc962SPaolo Bonzini * Guest started with "-drive cache=writethrough" 612ef5bc962SPaolo Bonzini * Guest sets status to 0 613ef5bc962SPaolo Bonzini * Guest sets DRIVER bit in status field 614ef5bc962SPaolo Bonzini * Guest reads host features (WCE=0, CONFIG_WCE=1) 615ef5bc962SPaolo Bonzini * Guest writes guest features (WCE=0, CONFIG_WCE=1) 616ef5bc962SPaolo Bonzini * Guest writes 1 to the WCE configuration field (writeback mode) 617ef5bc962SPaolo Bonzini * Guest sets DRIVER_OK bit in status field 618ef5bc962SPaolo Bonzini * 619ef5bc962SPaolo Bonzini * s->bs would erroneously be placed in writethrough mode. 620ef5bc962SPaolo Bonzini */ 621ef5bc962SPaolo Bonzini if (!(features & (1 << VIRTIO_BLK_F_CONFIG_WCE))) { 6226d7e73d6SFam Zheng aio_context_acquire(bdrv_get_aio_context(s->bs)); 6236d7e73d6SFam Zheng bdrv_set_enable_write_cache(s->bs, 6246d7e73d6SFam Zheng !!(features & (1 << VIRTIO_BLK_F_WCE))); 6256d7e73d6SFam Zheng aio_context_release(bdrv_get_aio_context(s->bs)); 6266e790746SPaolo Bonzini } 627ef5bc962SPaolo Bonzini } 6286e790746SPaolo Bonzini 6296e790746SPaolo Bonzini static void virtio_blk_save(QEMUFile *f, void *opaque) 6306e790746SPaolo Bonzini { 631b2b295a7SGreg Kurz VirtIODevice *vdev = VIRTIO_DEVICE(opaque); 6326e790746SPaolo Bonzini 6336e790746SPaolo Bonzini virtio_save(vdev, f); 634b2b295a7SGreg Kurz } 635b2b295a7SGreg Kurz 636b2b295a7SGreg Kurz static void virtio_blk_save_device(VirtIODevice *vdev, QEMUFile *f) 637b2b295a7SGreg Kurz { 638b2b295a7SGreg Kurz VirtIOBlock *s = VIRTIO_BLK(vdev); 639b2b295a7SGreg Kurz VirtIOBlockReq *req = s->rq; 6406e790746SPaolo Bonzini 6416e790746SPaolo Bonzini while (req) { 6426e790746SPaolo Bonzini qemu_put_sbyte(f, 1); 643f897bf75SStefan Hajnoczi qemu_put_buffer(f, (unsigned char *)&req->elem, 644671ec3f0SFam Zheng sizeof(VirtQueueElement)); 6456e790746SPaolo Bonzini req = req->next; 6466e790746SPaolo Bonzini } 6476e790746SPaolo Bonzini qemu_put_sbyte(f, 0); 6486e790746SPaolo Bonzini } 6496e790746SPaolo Bonzini 6506e790746SPaolo Bonzini static int virtio_blk_load(QEMUFile *f, void *opaque, int version_id) 6516e790746SPaolo Bonzini { 6526e790746SPaolo Bonzini VirtIOBlock *s = opaque; 6536e790746SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(s); 6546e790746SPaolo Bonzini 6556e790746SPaolo Bonzini if (version_id != 2) 6566e790746SPaolo Bonzini return -EINVAL; 6576e790746SPaolo Bonzini 658b2b295a7SGreg Kurz return virtio_load(vdev, f, version_id); 6596e790746SPaolo Bonzini } 6606e790746SPaolo Bonzini 661b2b295a7SGreg Kurz static int virtio_blk_load_device(VirtIODevice *vdev, QEMUFile *f, 662b2b295a7SGreg Kurz int version_id) 663b2b295a7SGreg Kurz { 664b2b295a7SGreg Kurz VirtIOBlock *s = VIRTIO_BLK(vdev); 665b2b295a7SGreg Kurz 6666e790746SPaolo Bonzini while (qemu_get_sbyte(f)) { 6676e790746SPaolo Bonzini VirtIOBlockReq *req = virtio_blk_alloc_request(s); 668f897bf75SStefan Hajnoczi qemu_get_buffer(f, (unsigned char *)&req->elem, 669671ec3f0SFam Zheng sizeof(VirtQueueElement)); 6706e790746SPaolo Bonzini req->next = s->rq; 6716e790746SPaolo Bonzini s->rq = req; 6726e790746SPaolo Bonzini 673f897bf75SStefan Hajnoczi virtqueue_map_sg(req->elem.in_sg, req->elem.in_addr, 674f897bf75SStefan Hajnoczi req->elem.in_num, 1); 675f897bf75SStefan Hajnoczi virtqueue_map_sg(req->elem.out_sg, req->elem.out_addr, 676f897bf75SStefan Hajnoczi req->elem.out_num, 0); 6776e790746SPaolo Bonzini } 6786e790746SPaolo Bonzini 6796e790746SPaolo Bonzini return 0; 6806e790746SPaolo Bonzini } 6816e790746SPaolo Bonzini 6826e790746SPaolo Bonzini static void virtio_blk_resize(void *opaque) 6836e790746SPaolo Bonzini { 6846e790746SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(opaque); 6856e790746SPaolo Bonzini 6866e790746SPaolo Bonzini virtio_notify_config(vdev); 6876e790746SPaolo Bonzini } 6886e790746SPaolo Bonzini 6896e790746SPaolo Bonzini static const BlockDevOps virtio_block_ops = { 6906e790746SPaolo Bonzini .resize_cb = virtio_blk_resize, 6916e790746SPaolo Bonzini }; 6926e790746SPaolo Bonzini 69384db52d0SStefan Hajnoczi #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 69484db52d0SStefan Hajnoczi /* Disable dataplane thread during live migration since it does not 69584db52d0SStefan Hajnoczi * update the dirty memory bitmap yet. 69684db52d0SStefan Hajnoczi */ 69784db52d0SStefan Hajnoczi static void virtio_blk_migration_state_changed(Notifier *notifier, void *data) 69884db52d0SStefan Hajnoczi { 69984db52d0SStefan Hajnoczi VirtIOBlock *s = container_of(notifier, VirtIOBlock, 70084db52d0SStefan Hajnoczi migration_state_notifier); 70184db52d0SStefan Hajnoczi MigrationState *mig = data; 7023ffeeef7SAndreas Färber Error *err = NULL; 70384db52d0SStefan Hajnoczi 70484db52d0SStefan Hajnoczi if (migration_in_setup(mig)) { 70584db52d0SStefan Hajnoczi if (!s->dataplane) { 70684db52d0SStefan Hajnoczi return; 70784db52d0SStefan Hajnoczi } 70884db52d0SStefan Hajnoczi virtio_blk_data_plane_destroy(s->dataplane); 70984db52d0SStefan Hajnoczi s->dataplane = NULL; 71084db52d0SStefan Hajnoczi } else if (migration_has_finished(mig) || 71184db52d0SStefan Hajnoczi migration_has_failed(mig)) { 71284db52d0SStefan Hajnoczi if (s->dataplane) { 71384db52d0SStefan Hajnoczi return; 71484db52d0SStefan Hajnoczi } 71584db52d0SStefan Hajnoczi bdrv_drain_all(); /* complete in-flight non-dataplane requests */ 71684db52d0SStefan Hajnoczi virtio_blk_data_plane_create(VIRTIO_DEVICE(s), &s->blk, 7173ffeeef7SAndreas Färber &s->dataplane, &err); 7183ffeeef7SAndreas Färber if (err != NULL) { 7193ffeeef7SAndreas Färber error_report("%s", error_get_pretty(err)); 7203ffeeef7SAndreas Färber error_free(err); 7213ffeeef7SAndreas Färber } 72284db52d0SStefan Hajnoczi } 72384db52d0SStefan Hajnoczi } 72484db52d0SStefan Hajnoczi #endif /* CONFIG_VIRTIO_BLK_DATA_PLANE */ 72584db52d0SStefan Hajnoczi 72675884afdSAndreas Färber static void virtio_blk_device_realize(DeviceState *dev, Error **errp) 7276e790746SPaolo Bonzini { 72875884afdSAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 729179b417eSAndreas Färber VirtIOBlock *s = VIRTIO_BLK(dev); 7306e790746SPaolo Bonzini VirtIOBlkConf *blk = &(s->blk); 7313ffeeef7SAndreas Färber #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 7323ffeeef7SAndreas Färber Error *err = NULL; 7333ffeeef7SAndreas Färber #endif 7346e790746SPaolo Bonzini static int virtio_blk_id; 7356e790746SPaolo Bonzini 7366e790746SPaolo Bonzini if (!blk->conf.bs) { 73775884afdSAndreas Färber error_setg(errp, "drive property not set"); 73875884afdSAndreas Färber return; 7396e790746SPaolo Bonzini } 7406e790746SPaolo Bonzini if (!bdrv_is_inserted(blk->conf.bs)) { 74175884afdSAndreas Färber error_setg(errp, "Device needs media, but drive is empty"); 74275884afdSAndreas Färber return; 7436e790746SPaolo Bonzini } 7446e790746SPaolo Bonzini 7456e790746SPaolo Bonzini blkconf_serial(&blk->conf, &blk->serial); 746ef5bc962SPaolo Bonzini s->original_wce = bdrv_enable_write_cache(blk->conf.bs); 7476e790746SPaolo Bonzini if (blkconf_geometry(&blk->conf, NULL, 65535, 255, 255) < 0) { 74875884afdSAndreas Färber error_setg(errp, "Error setting geometry"); 74975884afdSAndreas Färber return; 7506e790746SPaolo Bonzini } 7516e790746SPaolo Bonzini 7526e790746SPaolo Bonzini virtio_init(vdev, "virtio-blk", VIRTIO_ID_BLOCK, 7536e790746SPaolo Bonzini sizeof(struct virtio_blk_config)); 7546e790746SPaolo Bonzini 7556e790746SPaolo Bonzini s->bs = blk->conf.bs; 7566e790746SPaolo Bonzini s->conf = &blk->conf; 7576e790746SPaolo Bonzini s->rq = NULL; 7586e790746SPaolo Bonzini s->sector_mask = (s->conf->logical_block_size / BDRV_SECTOR_SIZE) - 1; 7596e790746SPaolo Bonzini 7606e790746SPaolo Bonzini s->vq = virtio_add_queue(vdev, 128, virtio_blk_handle_output); 761bf4bd461SFam Zheng s->complete_request = virtio_blk_complete_request; 7626e790746SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 7633ffeeef7SAndreas Färber virtio_blk_data_plane_create(vdev, blk, &s->dataplane, &err); 7643ffeeef7SAndreas Färber if (err != NULL) { 76575884afdSAndreas Färber error_propagate(errp, err); 7666a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 76775884afdSAndreas Färber return; 7686e790746SPaolo Bonzini } 76984db52d0SStefan Hajnoczi s->migration_state_notifier.notify = virtio_blk_migration_state_changed; 77084db52d0SStefan Hajnoczi add_migration_state_change_notifier(&s->migration_state_notifier); 7716e790746SPaolo Bonzini #endif 7726e790746SPaolo Bonzini 7736e790746SPaolo Bonzini s->change = qemu_add_vm_change_state_handler(virtio_blk_dma_restart_cb, s); 774179b417eSAndreas Färber register_savevm(dev, "virtio-blk", virtio_blk_id++, 2, 7756e790746SPaolo Bonzini virtio_blk_save, virtio_blk_load, s); 7766e790746SPaolo Bonzini bdrv_set_dev_ops(s->bs, &virtio_block_ops, s); 7771b7fd729SPaolo Bonzini bdrv_set_guest_block_size(s->bs, s->conf->logical_block_size); 7786e790746SPaolo Bonzini 7796e790746SPaolo Bonzini bdrv_iostatus_enable(s->bs); 7806e790746SPaolo Bonzini 781179b417eSAndreas Färber add_boot_device_path(s->conf->bootindex, dev, "/disk@0,0"); 7826e790746SPaolo Bonzini } 7836e790746SPaolo Bonzini 784306ec6c3SAndreas Färber static void virtio_blk_device_unrealize(DeviceState *dev, Error **errp) 7856e790746SPaolo Bonzini { 786306ec6c3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 787306ec6c3SAndreas Färber VirtIOBlock *s = VIRTIO_BLK(dev); 788306ec6c3SAndreas Färber 7896e790746SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 79084db52d0SStefan Hajnoczi remove_migration_state_change_notifier(&s->migration_state_notifier); 7916e790746SPaolo Bonzini virtio_blk_data_plane_destroy(s->dataplane); 7926e790746SPaolo Bonzini s->dataplane = NULL; 7936e790746SPaolo Bonzini #endif 7946e790746SPaolo Bonzini qemu_del_vm_change_state_handler(s->change); 795306ec6c3SAndreas Färber unregister_savevm(dev, "virtio-blk", s); 7966e790746SPaolo Bonzini blockdev_mark_auto_del(s->bs); 7976a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 7986e790746SPaolo Bonzini } 7996e790746SPaolo Bonzini 800467b3f33SStefan Hajnoczi static void virtio_blk_instance_init(Object *obj) 801467b3f33SStefan Hajnoczi { 802467b3f33SStefan Hajnoczi VirtIOBlock *s = VIRTIO_BLK(obj); 803467b3f33SStefan Hajnoczi 804467b3f33SStefan Hajnoczi object_property_add_link(obj, "iothread", TYPE_IOTHREAD, 805467b3f33SStefan Hajnoczi (Object **)&s->blk.iothread, 806467b3f33SStefan Hajnoczi qdev_prop_allow_set_link_before_realize, 807467b3f33SStefan Hajnoczi OBJ_PROP_LINK_UNREF_ON_RELEASE, NULL); 808467b3f33SStefan Hajnoczi } 809467b3f33SStefan Hajnoczi 8106e790746SPaolo Bonzini static Property virtio_blk_properties[] = { 81132a877e4SStefan Hajnoczi DEFINE_BLOCK_PROPERTIES(VirtIOBlock, blk.conf), 81232a877e4SStefan Hajnoczi DEFINE_BLOCK_CHS_PROPERTIES(VirtIOBlock, blk.conf), 81332a877e4SStefan Hajnoczi DEFINE_PROP_STRING("serial", VirtIOBlock, blk.serial), 81432a877e4SStefan Hajnoczi DEFINE_PROP_BIT("config-wce", VirtIOBlock, blk.config_wce, 0, true), 81532a877e4SStefan Hajnoczi #ifdef __linux__ 81632a877e4SStefan Hajnoczi DEFINE_PROP_BIT("scsi", VirtIOBlock, blk.scsi, 0, true), 81732a877e4SStefan Hajnoczi #endif 81832a877e4SStefan Hajnoczi #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 81932a877e4SStefan Hajnoczi DEFINE_PROP_BIT("x-data-plane", VirtIOBlock, blk.data_plane, 0, false), 82032a877e4SStefan Hajnoczi #endif 8216e790746SPaolo Bonzini DEFINE_PROP_END_OF_LIST(), 8226e790746SPaolo Bonzini }; 8236e790746SPaolo Bonzini 8246e790746SPaolo Bonzini static void virtio_blk_class_init(ObjectClass *klass, void *data) 8256e790746SPaolo Bonzini { 8266e790746SPaolo Bonzini DeviceClass *dc = DEVICE_CLASS(klass); 8276e790746SPaolo Bonzini VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass); 82875884afdSAndreas Färber 8296e790746SPaolo Bonzini dc->props = virtio_blk_properties; 830125ee0edSMarcel Apfelbaum set_bit(DEVICE_CATEGORY_STORAGE, dc->categories); 83175884afdSAndreas Färber vdc->realize = virtio_blk_device_realize; 832306ec6c3SAndreas Färber vdc->unrealize = virtio_blk_device_unrealize; 8336e790746SPaolo Bonzini vdc->get_config = virtio_blk_update_config; 8346e790746SPaolo Bonzini vdc->set_config = virtio_blk_set_config; 8356e790746SPaolo Bonzini vdc->get_features = virtio_blk_get_features; 8366e790746SPaolo Bonzini vdc->set_status = virtio_blk_set_status; 8376e790746SPaolo Bonzini vdc->reset = virtio_blk_reset; 838b2b295a7SGreg Kurz vdc->save = virtio_blk_save_device; 839b2b295a7SGreg Kurz vdc->load = virtio_blk_load_device; 8406e790746SPaolo Bonzini } 8416e790746SPaolo Bonzini 8426e790746SPaolo Bonzini static const TypeInfo virtio_device_info = { 8436e790746SPaolo Bonzini .name = TYPE_VIRTIO_BLK, 8446e790746SPaolo Bonzini .parent = TYPE_VIRTIO_DEVICE, 8456e790746SPaolo Bonzini .instance_size = sizeof(VirtIOBlock), 846467b3f33SStefan Hajnoczi .instance_init = virtio_blk_instance_init, 8476e790746SPaolo Bonzini .class_init = virtio_blk_class_init, 8486e790746SPaolo Bonzini }; 8496e790746SPaolo Bonzini 8506e790746SPaolo Bonzini static void virtio_register_types(void) 8516e790746SPaolo Bonzini { 8526e790746SPaolo Bonzini type_register_static(&virtio_device_info); 8536e790746SPaolo Bonzini } 8546e790746SPaolo Bonzini 8556e790746SPaolo Bonzini type_init(virtio_register_types) 856