16e790746SPaolo Bonzini /* 26e790746SPaolo Bonzini * Virtio Block Device 36e790746SPaolo Bonzini * 46e790746SPaolo Bonzini * Copyright IBM, Corp. 2007 56e790746SPaolo Bonzini * 66e790746SPaolo Bonzini * Authors: 76e790746SPaolo Bonzini * Anthony Liguori <aliguori@us.ibm.com> 86e790746SPaolo Bonzini * 96e790746SPaolo Bonzini * This work is licensed under the terms of the GNU GPL, version 2. See 106e790746SPaolo Bonzini * the COPYING file in the top-level directory. 116e790746SPaolo Bonzini * 126e790746SPaolo Bonzini */ 136e790746SPaolo Bonzini 146e790746SPaolo Bonzini #include "qemu-common.h" 15827805a2SFam Zheng #include "qemu/iov.h" 166e790746SPaolo Bonzini #include "qemu/error-report.h" 176e790746SPaolo Bonzini #include "trace.h" 186e790746SPaolo Bonzini #include "hw/block/block.h" 196e790746SPaolo Bonzini #include "sysemu/blockdev.h" 206e790746SPaolo Bonzini #include "hw/virtio/virtio-blk.h" 216e790746SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 226e790746SPaolo Bonzini # include "dataplane/virtio-blk.h" 2384db52d0SStefan Hajnoczi # include "migration/migration.h" 246e790746SPaolo Bonzini #endif 256e790746SPaolo Bonzini #include "block/scsi.h" 266e790746SPaolo Bonzini #ifdef __linux__ 276e790746SPaolo Bonzini # include <scsi/sg.h> 286e790746SPaolo Bonzini #endif 296e790746SPaolo Bonzini #include "hw/virtio/virtio-bus.h" 30783d1897SRusty Russell #include "hw/virtio/virtio-access.h" 316e790746SPaolo Bonzini 32f897bf75SStefan Hajnoczi VirtIOBlockReq *virtio_blk_alloc_request(VirtIOBlock *s) 33671ec3f0SFam Zheng { 34869d66afSStefan Hajnoczi VirtIOBlockReq *req = g_slice_new(VirtIOBlockReq); 35671ec3f0SFam Zheng req->dev = s; 36869d66afSStefan Hajnoczi req->qiov.size = 0; 37869d66afSStefan Hajnoczi req->next = NULL; 38671ec3f0SFam Zheng return req; 39671ec3f0SFam Zheng } 40671ec3f0SFam Zheng 41f897bf75SStefan Hajnoczi void virtio_blk_free_request(VirtIOBlockReq *req) 42671ec3f0SFam Zheng { 43671ec3f0SFam Zheng if (req) { 44671ec3f0SFam Zheng g_slice_free(VirtIOBlockReq, req); 45671ec3f0SFam Zheng } 46671ec3f0SFam Zheng } 47671ec3f0SFam Zheng 48bf4bd461SFam Zheng static void virtio_blk_complete_request(VirtIOBlockReq *req, 49bf4bd461SFam Zheng unsigned char status) 506e790746SPaolo Bonzini { 516e790746SPaolo Bonzini VirtIOBlock *s = req->dev; 526e790746SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(s); 536e790746SPaolo Bonzini 546e790746SPaolo Bonzini trace_virtio_blk_req_complete(req, status); 556e790746SPaolo Bonzini 566e790746SPaolo Bonzini stb_p(&req->in->status, status); 57f897bf75SStefan Hajnoczi virtqueue_push(s->vq, &req->elem, req->qiov.size + sizeof(*req->in)); 586e790746SPaolo Bonzini virtio_notify(vdev, s->vq); 596e790746SPaolo Bonzini } 606e790746SPaolo Bonzini 61bf4bd461SFam Zheng static void virtio_blk_req_complete(VirtIOBlockReq *req, unsigned char status) 62bf4bd461SFam Zheng { 63bf4bd461SFam Zheng req->dev->complete_request(req, status); 64bf4bd461SFam Zheng } 65bf4bd461SFam Zheng 666e790746SPaolo Bonzini static int virtio_blk_handle_rw_error(VirtIOBlockReq *req, int error, 676e790746SPaolo Bonzini bool is_read) 686e790746SPaolo Bonzini { 696e790746SPaolo Bonzini BlockErrorAction action = bdrv_get_error_action(req->dev->bs, is_read, error); 706e790746SPaolo Bonzini VirtIOBlock *s = req->dev; 716e790746SPaolo Bonzini 72a589569fSWenchao Xia if (action == BLOCK_ERROR_ACTION_STOP) { 736e790746SPaolo Bonzini req->next = s->rq; 746e790746SPaolo Bonzini s->rq = req; 75a589569fSWenchao Xia } else if (action == BLOCK_ERROR_ACTION_REPORT) { 766e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); 776e790746SPaolo Bonzini bdrv_acct_done(s->bs, &req->acct); 78671ec3f0SFam Zheng virtio_blk_free_request(req); 796e790746SPaolo Bonzini } 806e790746SPaolo Bonzini 816e790746SPaolo Bonzini bdrv_error_action(s->bs, action, is_read, error); 82a589569fSWenchao Xia return action != BLOCK_ERROR_ACTION_IGNORE; 836e790746SPaolo Bonzini } 846e790746SPaolo Bonzini 856e790746SPaolo Bonzini static void virtio_blk_rw_complete(void *opaque, int ret) 866e790746SPaolo Bonzini { 876e790746SPaolo Bonzini VirtIOBlockReq *req = opaque; 886e790746SPaolo Bonzini 896e790746SPaolo Bonzini trace_virtio_blk_rw_complete(req, ret); 906e790746SPaolo Bonzini 916e790746SPaolo Bonzini if (ret) { 92783d1897SRusty Russell int p = virtio_ldl_p(VIRTIO_DEVICE(req->dev), &req->out.type); 93783d1897SRusty Russell bool is_read = !(p & VIRTIO_BLK_T_OUT); 946e790746SPaolo Bonzini if (virtio_blk_handle_rw_error(req, -ret, is_read)) 956e790746SPaolo Bonzini return; 966e790746SPaolo Bonzini } 976e790746SPaolo Bonzini 986e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 996e790746SPaolo Bonzini bdrv_acct_done(req->dev->bs, &req->acct); 100671ec3f0SFam Zheng virtio_blk_free_request(req); 1016e790746SPaolo Bonzini } 1026e790746SPaolo Bonzini 1036e790746SPaolo Bonzini static void virtio_blk_flush_complete(void *opaque, int ret) 1046e790746SPaolo Bonzini { 1056e790746SPaolo Bonzini VirtIOBlockReq *req = opaque; 1066e790746SPaolo Bonzini 1076e790746SPaolo Bonzini if (ret) { 1086e790746SPaolo Bonzini if (virtio_blk_handle_rw_error(req, -ret, 0)) { 1096e790746SPaolo Bonzini return; 1106e790746SPaolo Bonzini } 1116e790746SPaolo Bonzini } 1126e790746SPaolo Bonzini 1136e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 1146e790746SPaolo Bonzini bdrv_acct_done(req->dev->bs, &req->acct); 115671ec3f0SFam Zheng virtio_blk_free_request(req); 1166e790746SPaolo Bonzini } 1176e790746SPaolo Bonzini 1186e790746SPaolo Bonzini static VirtIOBlockReq *virtio_blk_get_request(VirtIOBlock *s) 1196e790746SPaolo Bonzini { 1206e790746SPaolo Bonzini VirtIOBlockReq *req = virtio_blk_alloc_request(s); 1216e790746SPaolo Bonzini 122f897bf75SStefan Hajnoczi if (!virtqueue_pop(s->vq, &req->elem)) { 123671ec3f0SFam Zheng virtio_blk_free_request(req); 1246e790746SPaolo Bonzini return NULL; 1256e790746SPaolo Bonzini } 1266e790746SPaolo Bonzini 1276e790746SPaolo Bonzini return req; 1286e790746SPaolo Bonzini } 1296e790746SPaolo Bonzini 1305a05cbeeSFam Zheng int virtio_blk_handle_scsi_req(VirtIOBlock *blk, 1315a05cbeeSFam Zheng VirtQueueElement *elem) 1326e790746SPaolo Bonzini { 1336e790746SPaolo Bonzini int status = VIRTIO_BLK_S_OK; 1345a05cbeeSFam Zheng struct virtio_scsi_inhdr *scsi = NULL; 135783d1897SRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(blk); 136783d1897SRusty Russell 1375a05cbeeSFam Zheng #ifdef __linux__ 1385a05cbeeSFam Zheng int i; 1395a05cbeeSFam Zheng struct sg_io_hdr hdr; 1405a05cbeeSFam Zheng #endif 1416e790746SPaolo Bonzini 1426e790746SPaolo Bonzini /* 1436e790746SPaolo Bonzini * We require at least one output segment each for the virtio_blk_outhdr 1446e790746SPaolo Bonzini * and the SCSI command block. 1456e790746SPaolo Bonzini * 1466e790746SPaolo Bonzini * We also at least require the virtio_blk_inhdr, the virtio_scsi_inhdr 1476e790746SPaolo Bonzini * and the sense buffer pointer in the input segments. 1486e790746SPaolo Bonzini */ 1495a05cbeeSFam Zheng if (elem->out_num < 2 || elem->in_num < 3) { 1505a05cbeeSFam Zheng status = VIRTIO_BLK_S_IOERR; 1515a05cbeeSFam Zheng goto fail; 1526e790746SPaolo Bonzini } 1536e790746SPaolo Bonzini 1546e790746SPaolo Bonzini /* 1556e790746SPaolo Bonzini * The scsi inhdr is placed in the second-to-last input segment, just 1566e790746SPaolo Bonzini * before the regular inhdr. 1576e790746SPaolo Bonzini */ 1585a05cbeeSFam Zheng scsi = (void *)elem->in_sg[elem->in_num - 2].iov_base; 1596e790746SPaolo Bonzini 1605a05cbeeSFam Zheng if (!blk->blk.scsi) { 1616e790746SPaolo Bonzini status = VIRTIO_BLK_S_UNSUPP; 1626e790746SPaolo Bonzini goto fail; 1636e790746SPaolo Bonzini } 1646e790746SPaolo Bonzini 1656e790746SPaolo Bonzini /* 1666e790746SPaolo Bonzini * No support for bidirection commands yet. 1676e790746SPaolo Bonzini */ 1685a05cbeeSFam Zheng if (elem->out_num > 2 && elem->in_num > 3) { 1696e790746SPaolo Bonzini status = VIRTIO_BLK_S_UNSUPP; 1706e790746SPaolo Bonzini goto fail; 1716e790746SPaolo Bonzini } 1726e790746SPaolo Bonzini 1736e790746SPaolo Bonzini #ifdef __linux__ 1746e790746SPaolo Bonzini memset(&hdr, 0, sizeof(struct sg_io_hdr)); 1756e790746SPaolo Bonzini hdr.interface_id = 'S'; 1765a05cbeeSFam Zheng hdr.cmd_len = elem->out_sg[1].iov_len; 1775a05cbeeSFam Zheng hdr.cmdp = elem->out_sg[1].iov_base; 1786e790746SPaolo Bonzini hdr.dxfer_len = 0; 1796e790746SPaolo Bonzini 1805a05cbeeSFam Zheng if (elem->out_num > 2) { 1816e790746SPaolo Bonzini /* 1826e790746SPaolo Bonzini * If there are more than the minimally required 2 output segments 1836e790746SPaolo Bonzini * there is write payload starting from the third iovec. 1846e790746SPaolo Bonzini */ 1856e790746SPaolo Bonzini hdr.dxfer_direction = SG_DXFER_TO_DEV; 1865a05cbeeSFam Zheng hdr.iovec_count = elem->out_num - 2; 1876e790746SPaolo Bonzini 1886e790746SPaolo Bonzini for (i = 0; i < hdr.iovec_count; i++) 1895a05cbeeSFam Zheng hdr.dxfer_len += elem->out_sg[i + 2].iov_len; 1906e790746SPaolo Bonzini 1915a05cbeeSFam Zheng hdr.dxferp = elem->out_sg + 2; 1926e790746SPaolo Bonzini 1935a05cbeeSFam Zheng } else if (elem->in_num > 3) { 1946e790746SPaolo Bonzini /* 1956e790746SPaolo Bonzini * If we have more than 3 input segments the guest wants to actually 1966e790746SPaolo Bonzini * read data. 1976e790746SPaolo Bonzini */ 1986e790746SPaolo Bonzini hdr.dxfer_direction = SG_DXFER_FROM_DEV; 1995a05cbeeSFam Zheng hdr.iovec_count = elem->in_num - 3; 2006e790746SPaolo Bonzini for (i = 0; i < hdr.iovec_count; i++) 2015a05cbeeSFam Zheng hdr.dxfer_len += elem->in_sg[i].iov_len; 2026e790746SPaolo Bonzini 2035a05cbeeSFam Zheng hdr.dxferp = elem->in_sg; 2046e790746SPaolo Bonzini } else { 2056e790746SPaolo Bonzini /* 2066e790746SPaolo Bonzini * Some SCSI commands don't actually transfer any data. 2076e790746SPaolo Bonzini */ 2086e790746SPaolo Bonzini hdr.dxfer_direction = SG_DXFER_NONE; 2096e790746SPaolo Bonzini } 2106e790746SPaolo Bonzini 2115a05cbeeSFam Zheng hdr.sbp = elem->in_sg[elem->in_num - 3].iov_base; 2125a05cbeeSFam Zheng hdr.mx_sb_len = elem->in_sg[elem->in_num - 3].iov_len; 2136e790746SPaolo Bonzini 2145a05cbeeSFam Zheng status = bdrv_ioctl(blk->bs, SG_IO, &hdr); 2155a05cbeeSFam Zheng if (status) { 2166e790746SPaolo Bonzini status = VIRTIO_BLK_S_UNSUPP; 2176e790746SPaolo Bonzini goto fail; 2186e790746SPaolo Bonzini } 2196e790746SPaolo Bonzini 2206e790746SPaolo Bonzini /* 2216e790746SPaolo Bonzini * From SCSI-Generic-HOWTO: "Some lower level drivers (e.g. ide-scsi) 2226e790746SPaolo Bonzini * clear the masked_status field [hence status gets cleared too, see 2236e790746SPaolo Bonzini * block/scsi_ioctl.c] even when a CHECK_CONDITION or COMMAND_TERMINATED 2246e790746SPaolo Bonzini * status has occurred. However they do set DRIVER_SENSE in driver_status 2256e790746SPaolo Bonzini * field. Also a (sb_len_wr > 0) indicates there is a sense buffer. 2266e790746SPaolo Bonzini */ 2276e790746SPaolo Bonzini if (hdr.status == 0 && hdr.sb_len_wr > 0) { 2286e790746SPaolo Bonzini hdr.status = CHECK_CONDITION; 2296e790746SPaolo Bonzini } 2306e790746SPaolo Bonzini 231783d1897SRusty Russell virtio_stl_p(vdev, &scsi->errors, 2326e790746SPaolo Bonzini hdr.status | (hdr.msg_status << 8) | 2336e790746SPaolo Bonzini (hdr.host_status << 16) | (hdr.driver_status << 24)); 234783d1897SRusty Russell virtio_stl_p(vdev, &scsi->residual, hdr.resid); 235783d1897SRusty Russell virtio_stl_p(vdev, &scsi->sense_len, hdr.sb_len_wr); 236783d1897SRusty Russell virtio_stl_p(vdev, &scsi->data_len, hdr.dxfer_len); 2376e790746SPaolo Bonzini 2385a05cbeeSFam Zheng return status; 2396e790746SPaolo Bonzini #else 2406e790746SPaolo Bonzini abort(); 2416e790746SPaolo Bonzini #endif 2426e790746SPaolo Bonzini 2436e790746SPaolo Bonzini fail: 2446e790746SPaolo Bonzini /* Just put anything nonzero so that the ioctl fails in the guest. */ 2455a05cbeeSFam Zheng if (scsi) { 246783d1897SRusty Russell virtio_stl_p(vdev, &scsi->errors, 255); 2475a05cbeeSFam Zheng } 2485a05cbeeSFam Zheng return status; 2495a05cbeeSFam Zheng } 2505a05cbeeSFam Zheng 2515a05cbeeSFam Zheng static void virtio_blk_handle_scsi(VirtIOBlockReq *req) 2525a05cbeeSFam Zheng { 2535a05cbeeSFam Zheng int status; 2545a05cbeeSFam Zheng 255f897bf75SStefan Hajnoczi status = virtio_blk_handle_scsi_req(req->dev, &req->elem); 2566e790746SPaolo Bonzini virtio_blk_req_complete(req, status); 257671ec3f0SFam Zheng virtio_blk_free_request(req); 2586e790746SPaolo Bonzini } 2596e790746SPaolo Bonzini 260fee65db7SFam Zheng void virtio_submit_multiwrite(BlockDriverState *bs, MultiReqBuffer *mrb) 2616e790746SPaolo Bonzini { 2626e790746SPaolo Bonzini int i, ret; 2636e790746SPaolo Bonzini 2646e790746SPaolo Bonzini if (!mrb->num_writes) { 2656e790746SPaolo Bonzini return; 2666e790746SPaolo Bonzini } 2676e790746SPaolo Bonzini 2686e790746SPaolo Bonzini ret = bdrv_aio_multiwrite(bs, mrb->blkreq, mrb->num_writes); 2696e790746SPaolo Bonzini if (ret != 0) { 2706e790746SPaolo Bonzini for (i = 0; i < mrb->num_writes; i++) { 2716e790746SPaolo Bonzini if (mrb->blkreq[i].error) { 2726e790746SPaolo Bonzini virtio_blk_rw_complete(mrb->blkreq[i].opaque, -EIO); 2736e790746SPaolo Bonzini } 2746e790746SPaolo Bonzini } 2756e790746SPaolo Bonzini } 2766e790746SPaolo Bonzini 2776e790746SPaolo Bonzini mrb->num_writes = 0; 2786e790746SPaolo Bonzini } 2796e790746SPaolo Bonzini 2806e790746SPaolo Bonzini static void virtio_blk_handle_flush(VirtIOBlockReq *req, MultiReqBuffer *mrb) 2816e790746SPaolo Bonzini { 2826e790746SPaolo Bonzini bdrv_acct_start(req->dev->bs, &req->acct, 0, BDRV_ACCT_FLUSH); 2836e790746SPaolo Bonzini 2846e790746SPaolo Bonzini /* 2856e790746SPaolo Bonzini * Make sure all outstanding writes are posted to the backing device. 2866e790746SPaolo Bonzini */ 2876e790746SPaolo Bonzini virtio_submit_multiwrite(req->dev->bs, mrb); 2886e790746SPaolo Bonzini bdrv_aio_flush(req->dev->bs, virtio_blk_flush_complete, req); 2896e790746SPaolo Bonzini } 2906e790746SPaolo Bonzini 291d0e14376SMarkus Armbruster static bool virtio_blk_sect_range_ok(VirtIOBlock *dev, 292d0e14376SMarkus Armbruster uint64_t sector, size_t size) 293d0e14376SMarkus Armbruster { 2943c2daac0SMarkus Armbruster uint64_t nb_sectors = size >> BDRV_SECTOR_BITS; 2953c2daac0SMarkus Armbruster uint64_t total_sectors; 2963c2daac0SMarkus Armbruster 297d0e14376SMarkus Armbruster if (sector & dev->sector_mask) { 298d0e14376SMarkus Armbruster return false; 299d0e14376SMarkus Armbruster } 300d0e14376SMarkus Armbruster if (size % dev->conf->logical_block_size) { 301d0e14376SMarkus Armbruster return false; 302d0e14376SMarkus Armbruster } 3033c2daac0SMarkus Armbruster bdrv_get_geometry(dev->bs, &total_sectors); 3043c2daac0SMarkus Armbruster if (sector > total_sectors || nb_sectors > total_sectors - sector) { 3053c2daac0SMarkus Armbruster return false; 3063c2daac0SMarkus Armbruster } 307d0e14376SMarkus Armbruster return true; 308d0e14376SMarkus Armbruster } 309d0e14376SMarkus Armbruster 3106e790746SPaolo Bonzini static void virtio_blk_handle_write(VirtIOBlockReq *req, MultiReqBuffer *mrb) 3116e790746SPaolo Bonzini { 3126e790746SPaolo Bonzini BlockRequest *blkreq; 3136e790746SPaolo Bonzini uint64_t sector; 3146e790746SPaolo Bonzini 315783d1897SRusty Russell sector = virtio_ldq_p(VIRTIO_DEVICE(req->dev), &req->out.sector); 3166e790746SPaolo Bonzini 3176e790746SPaolo Bonzini trace_virtio_blk_handle_write(req, sector, req->qiov.size / 512); 3186e790746SPaolo Bonzini 319d0e14376SMarkus Armbruster if (!virtio_blk_sect_range_ok(req->dev, sector, req->qiov.size)) { 32042e38c1fSMarkus Armbruster virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); 32142e38c1fSMarkus Armbruster virtio_blk_free_request(req); 3226e790746SPaolo Bonzini return; 3236e790746SPaolo Bonzini } 3246e790746SPaolo Bonzini 32542e38c1fSMarkus Armbruster bdrv_acct_start(req->dev->bs, &req->acct, req->qiov.size, BDRV_ACCT_WRITE); 32642e38c1fSMarkus Armbruster 3276e790746SPaolo Bonzini if (mrb->num_writes == 32) { 3286e790746SPaolo Bonzini virtio_submit_multiwrite(req->dev->bs, mrb); 3296e790746SPaolo Bonzini } 3306e790746SPaolo Bonzini 3316e790746SPaolo Bonzini blkreq = &mrb->blkreq[mrb->num_writes]; 3326e790746SPaolo Bonzini blkreq->sector = sector; 3336e790746SPaolo Bonzini blkreq->nb_sectors = req->qiov.size / BDRV_SECTOR_SIZE; 3346e790746SPaolo Bonzini blkreq->qiov = &req->qiov; 3356e790746SPaolo Bonzini blkreq->cb = virtio_blk_rw_complete; 3366e790746SPaolo Bonzini blkreq->opaque = req; 3376e790746SPaolo Bonzini blkreq->error = 0; 3386e790746SPaolo Bonzini 3396e790746SPaolo Bonzini mrb->num_writes++; 3406e790746SPaolo Bonzini } 3416e790746SPaolo Bonzini 3426e790746SPaolo Bonzini static void virtio_blk_handle_read(VirtIOBlockReq *req) 3436e790746SPaolo Bonzini { 3446e790746SPaolo Bonzini uint64_t sector; 3456e790746SPaolo Bonzini 346783d1897SRusty Russell sector = virtio_ldq_p(VIRTIO_DEVICE(req->dev), &req->out.sector); 3476e790746SPaolo Bonzini 3486e790746SPaolo Bonzini trace_virtio_blk_handle_read(req, sector, req->qiov.size / 512); 3496e790746SPaolo Bonzini 350d0e14376SMarkus Armbruster if (!virtio_blk_sect_range_ok(req->dev, sector, req->qiov.size)) { 35142e38c1fSMarkus Armbruster virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); 35242e38c1fSMarkus Armbruster virtio_blk_free_request(req); 3536e790746SPaolo Bonzini return; 3546e790746SPaolo Bonzini } 35542e38c1fSMarkus Armbruster 35642e38c1fSMarkus Armbruster bdrv_acct_start(req->dev->bs, &req->acct, req->qiov.size, BDRV_ACCT_READ); 3576e790746SPaolo Bonzini bdrv_aio_readv(req->dev->bs, sector, &req->qiov, 3586e790746SPaolo Bonzini req->qiov.size / BDRV_SECTOR_SIZE, 3596e790746SPaolo Bonzini virtio_blk_rw_complete, req); 3606e790746SPaolo Bonzini } 3616e790746SPaolo Bonzini 362fee65db7SFam Zheng void virtio_blk_handle_request(VirtIOBlockReq *req, MultiReqBuffer *mrb) 3636e790746SPaolo Bonzini { 3646e790746SPaolo Bonzini uint32_t type; 365f897bf75SStefan Hajnoczi struct iovec *in_iov = req->elem.in_sg; 366f897bf75SStefan Hajnoczi struct iovec *iov = req->elem.out_sg; 367f897bf75SStefan Hajnoczi unsigned in_num = req->elem.in_num; 368f897bf75SStefan Hajnoczi unsigned out_num = req->elem.out_num; 3696e790746SPaolo Bonzini 370f897bf75SStefan Hajnoczi if (req->elem.out_num < 1 || req->elem.in_num < 1) { 3716e790746SPaolo Bonzini error_report("virtio-blk missing headers"); 3726e790746SPaolo Bonzini exit(1); 3736e790746SPaolo Bonzini } 3746e790746SPaolo Bonzini 375827805a2SFam Zheng if (unlikely(iov_to_buf(iov, out_num, 0, &req->out, 376827805a2SFam Zheng sizeof(req->out)) != sizeof(req->out))) { 377827805a2SFam Zheng error_report("virtio-blk request outhdr too short"); 378827805a2SFam Zheng exit(1); 379827805a2SFam Zheng } 380ee17e848SFam Zheng 381827805a2SFam Zheng iov_discard_front(&iov, &out_num, sizeof(req->out)); 382ee17e848SFam Zheng 383ee17e848SFam Zheng if (in_num < 1 || 384ee17e848SFam Zheng in_iov[in_num - 1].iov_len < sizeof(struct virtio_blk_inhdr)) { 385ee17e848SFam Zheng error_report("virtio-blk request inhdr too short"); 386ee17e848SFam Zheng exit(1); 387ee17e848SFam Zheng } 388ee17e848SFam Zheng 389ee17e848SFam Zheng req->in = (void *)in_iov[in_num - 1].iov_base 390ee17e848SFam Zheng + in_iov[in_num - 1].iov_len 391ee17e848SFam Zheng - sizeof(struct virtio_blk_inhdr); 392ee17e848SFam Zheng iov_discard_back(in_iov, &in_num, sizeof(struct virtio_blk_inhdr)); 3936e790746SPaolo Bonzini 394783d1897SRusty Russell type = virtio_ldl_p(VIRTIO_DEVICE(req->dev), &req->out.type); 3956e790746SPaolo Bonzini 3966e790746SPaolo Bonzini if (type & VIRTIO_BLK_T_FLUSH) { 3976e790746SPaolo Bonzini virtio_blk_handle_flush(req, mrb); 3986e790746SPaolo Bonzini } else if (type & VIRTIO_BLK_T_SCSI_CMD) { 3996e790746SPaolo Bonzini virtio_blk_handle_scsi(req); 4006e790746SPaolo Bonzini } else if (type & VIRTIO_BLK_T_GET_ID) { 4016e790746SPaolo Bonzini VirtIOBlock *s = req->dev; 4026e790746SPaolo Bonzini 4036e790746SPaolo Bonzini /* 4046e790746SPaolo Bonzini * NB: per existing s/n string convention the string is 4056e790746SPaolo Bonzini * terminated by '\0' only when shorter than buffer. 4066e790746SPaolo Bonzini */ 407a83ceea8SMarc Marí const char *serial = s->blk.serial ? s->blk.serial : ""; 408a83ceea8SMarc Marí size_t size = MIN(strlen(serial) + 1, 409a83ceea8SMarc Marí MIN(iov_size(in_iov, in_num), 410a83ceea8SMarc Marí VIRTIO_BLK_ID_BYTES)); 411a83ceea8SMarc Marí iov_from_buf(in_iov, in_num, 0, serial, size); 4126e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 413671ec3f0SFam Zheng virtio_blk_free_request(req); 4146e790746SPaolo Bonzini } else if (type & VIRTIO_BLK_T_OUT) { 415a83ceea8SMarc Marí qemu_iovec_init_external(&req->qiov, iov, out_num); 4166e790746SPaolo Bonzini virtio_blk_handle_write(req, mrb); 4176e790746SPaolo Bonzini } else if (type == VIRTIO_BLK_T_IN || type == VIRTIO_BLK_T_BARRIER) { 4186e790746SPaolo Bonzini /* VIRTIO_BLK_T_IN is 0, so we can't just & it. */ 419a83ceea8SMarc Marí qemu_iovec_init_external(&req->qiov, in_iov, in_num); 4206e790746SPaolo Bonzini virtio_blk_handle_read(req); 4216e790746SPaolo Bonzini } else { 4226e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_UNSUPP); 423671ec3f0SFam Zheng virtio_blk_free_request(req); 4246e790746SPaolo Bonzini } 4256e790746SPaolo Bonzini } 4266e790746SPaolo Bonzini 4276e790746SPaolo Bonzini static void virtio_blk_handle_output(VirtIODevice *vdev, VirtQueue *vq) 4286e790746SPaolo Bonzini { 4296e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 4306e790746SPaolo Bonzini VirtIOBlockReq *req; 4316e790746SPaolo Bonzini MultiReqBuffer mrb = { 4326e790746SPaolo Bonzini .num_writes = 0, 4336e790746SPaolo Bonzini }; 4346e790746SPaolo Bonzini 4356e790746SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 4366e790746SPaolo Bonzini /* Some guests kick before setting VIRTIO_CONFIG_S_DRIVER_OK so start 4376e790746SPaolo Bonzini * dataplane here instead of waiting for .set_status(). 4386e790746SPaolo Bonzini */ 4396e790746SPaolo Bonzini if (s->dataplane) { 4406e790746SPaolo Bonzini virtio_blk_data_plane_start(s->dataplane); 4416e790746SPaolo Bonzini return; 4426e790746SPaolo Bonzini } 4436e790746SPaolo Bonzini #endif 4446e790746SPaolo Bonzini 4456e790746SPaolo Bonzini while ((req = virtio_blk_get_request(s))) { 4466e790746SPaolo Bonzini virtio_blk_handle_request(req, &mrb); 4476e790746SPaolo Bonzini } 4486e790746SPaolo Bonzini 4496e790746SPaolo Bonzini virtio_submit_multiwrite(s->bs, &mrb); 4506e790746SPaolo Bonzini 4516e790746SPaolo Bonzini /* 4526e790746SPaolo Bonzini * FIXME: Want to check for completions before returning to guest mode, 4536e790746SPaolo Bonzini * so cached reads and writes are reported as quickly as possible. But 4546e790746SPaolo Bonzini * that should be done in the generic block layer. 4556e790746SPaolo Bonzini */ 4566e790746SPaolo Bonzini } 4576e790746SPaolo Bonzini 4586e790746SPaolo Bonzini static void virtio_blk_dma_restart_bh(void *opaque) 4596e790746SPaolo Bonzini { 4606e790746SPaolo Bonzini VirtIOBlock *s = opaque; 4616e790746SPaolo Bonzini VirtIOBlockReq *req = s->rq; 4626e790746SPaolo Bonzini MultiReqBuffer mrb = { 4636e790746SPaolo Bonzini .num_writes = 0, 4646e790746SPaolo Bonzini }; 4656e790746SPaolo Bonzini 4666e790746SPaolo Bonzini qemu_bh_delete(s->bh); 4676e790746SPaolo Bonzini s->bh = NULL; 4686e790746SPaolo Bonzini 4696e790746SPaolo Bonzini s->rq = NULL; 4706e790746SPaolo Bonzini 4716e790746SPaolo Bonzini while (req) { 472*1bdb176aSzhanghailiang VirtIOBlockReq *next = req->next; 4736e790746SPaolo Bonzini virtio_blk_handle_request(req, &mrb); 474*1bdb176aSzhanghailiang req = next; 4756e790746SPaolo Bonzini } 4766e790746SPaolo Bonzini 4776e790746SPaolo Bonzini virtio_submit_multiwrite(s->bs, &mrb); 4786e790746SPaolo Bonzini } 4796e790746SPaolo Bonzini 4806e790746SPaolo Bonzini static void virtio_blk_dma_restart_cb(void *opaque, int running, 4816e790746SPaolo Bonzini RunState state) 4826e790746SPaolo Bonzini { 4836e790746SPaolo Bonzini VirtIOBlock *s = opaque; 4846e790746SPaolo Bonzini 4856e790746SPaolo Bonzini if (!running) { 4866e790746SPaolo Bonzini return; 4876e790746SPaolo Bonzini } 4886e790746SPaolo Bonzini 4896e790746SPaolo Bonzini if (!s->bh) { 4904407c1c5SFam Zheng s->bh = aio_bh_new(bdrv_get_aio_context(s->blk.conf.bs), 4914407c1c5SFam Zheng virtio_blk_dma_restart_bh, s); 4926e790746SPaolo Bonzini qemu_bh_schedule(s->bh); 4936e790746SPaolo Bonzini } 4946e790746SPaolo Bonzini } 4956e790746SPaolo Bonzini 4966e790746SPaolo Bonzini static void virtio_blk_reset(VirtIODevice *vdev) 4976e790746SPaolo Bonzini { 4986e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 4996e790746SPaolo Bonzini 500ef5bc962SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 5016e790746SPaolo Bonzini if (s->dataplane) { 5026e790746SPaolo Bonzini virtio_blk_data_plane_stop(s->dataplane); 5036e790746SPaolo Bonzini } 5046e790746SPaolo Bonzini #endif 5056e790746SPaolo Bonzini 5066e790746SPaolo Bonzini /* 5076e790746SPaolo Bonzini * This should cancel pending requests, but can't do nicely until there 5086e790746SPaolo Bonzini * are per-device request lists. 5096e790746SPaolo Bonzini */ 5106e790746SPaolo Bonzini bdrv_drain_all(); 511ef5bc962SPaolo Bonzini bdrv_set_enable_write_cache(s->bs, s->original_wce); 5126e790746SPaolo Bonzini } 5136e790746SPaolo Bonzini 5146e790746SPaolo Bonzini /* coalesce internal state, copy to pci i/o region 0 5156e790746SPaolo Bonzini */ 5166e790746SPaolo Bonzini static void virtio_blk_update_config(VirtIODevice *vdev, uint8_t *config) 5176e790746SPaolo Bonzini { 5186e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5196e790746SPaolo Bonzini struct virtio_blk_config blkcfg; 5206e790746SPaolo Bonzini uint64_t capacity; 5216e790746SPaolo Bonzini int blk_size = s->conf->logical_block_size; 5226e790746SPaolo Bonzini 5236e790746SPaolo Bonzini bdrv_get_geometry(s->bs, &capacity); 5246e790746SPaolo Bonzini memset(&blkcfg, 0, sizeof(blkcfg)); 525783d1897SRusty Russell virtio_stq_p(vdev, &blkcfg.capacity, capacity); 526783d1897SRusty Russell virtio_stl_p(vdev, &blkcfg.seg_max, 128 - 2); 527783d1897SRusty Russell virtio_stw_p(vdev, &blkcfg.cylinders, s->conf->cyls); 528783d1897SRusty Russell virtio_stl_p(vdev, &blkcfg.blk_size, blk_size); 529783d1897SRusty Russell virtio_stw_p(vdev, &blkcfg.min_io_size, s->conf->min_io_size / blk_size); 530783d1897SRusty Russell virtio_stw_p(vdev, &blkcfg.opt_io_size, s->conf->opt_io_size / blk_size); 5316e790746SPaolo Bonzini blkcfg.heads = s->conf->heads; 5326e790746SPaolo Bonzini /* 5336e790746SPaolo Bonzini * We must ensure that the block device capacity is a multiple of 534e03ba136SPeter Maydell * the logical block size. If that is not the case, let's use 5356e790746SPaolo Bonzini * sector_mask to adopt the geometry to have a correct picture. 5366e790746SPaolo Bonzini * For those devices where the capacity is ok for the given geometry 537e03ba136SPeter Maydell * we don't touch the sector value of the geometry, since some devices 5386e790746SPaolo Bonzini * (like s390 dasd) need a specific value. Here the capacity is already 5396e790746SPaolo Bonzini * cyls*heads*secs*blk_size and the sector value is not block size 5406e790746SPaolo Bonzini * divided by 512 - instead it is the amount of blk_size blocks 5416e790746SPaolo Bonzini * per track (cylinder). 5426e790746SPaolo Bonzini */ 5436e790746SPaolo Bonzini if (bdrv_getlength(s->bs) / s->conf->heads / s->conf->secs % blk_size) { 5446e790746SPaolo Bonzini blkcfg.sectors = s->conf->secs & ~s->sector_mask; 5456e790746SPaolo Bonzini } else { 5466e790746SPaolo Bonzini blkcfg.sectors = s->conf->secs; 5476e790746SPaolo Bonzini } 5486e790746SPaolo Bonzini blkcfg.size_max = 0; 5496e790746SPaolo Bonzini blkcfg.physical_block_exp = get_physical_block_exp(s->conf); 5506e790746SPaolo Bonzini blkcfg.alignment_offset = 0; 5516e790746SPaolo Bonzini blkcfg.wce = bdrv_enable_write_cache(s->bs); 5526e790746SPaolo Bonzini memcpy(config, &blkcfg, sizeof(struct virtio_blk_config)); 5536e790746SPaolo Bonzini } 5546e790746SPaolo Bonzini 5556e790746SPaolo Bonzini static void virtio_blk_set_config(VirtIODevice *vdev, const uint8_t *config) 5566e790746SPaolo Bonzini { 5576e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5586e790746SPaolo Bonzini struct virtio_blk_config blkcfg; 5596e790746SPaolo Bonzini 5606e790746SPaolo Bonzini memcpy(&blkcfg, config, sizeof(blkcfg)); 5616d7e73d6SFam Zheng 5626d7e73d6SFam Zheng aio_context_acquire(bdrv_get_aio_context(s->bs)); 5636e790746SPaolo Bonzini bdrv_set_enable_write_cache(s->bs, blkcfg.wce != 0); 5646d7e73d6SFam Zheng aio_context_release(bdrv_get_aio_context(s->bs)); 5656e790746SPaolo Bonzini } 5666e790746SPaolo Bonzini 5676e790746SPaolo Bonzini static uint32_t virtio_blk_get_features(VirtIODevice *vdev, uint32_t features) 5686e790746SPaolo Bonzini { 5696e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5706e790746SPaolo Bonzini 5716e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_SEG_MAX); 5726e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_GEOMETRY); 5736e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_TOPOLOGY); 5746e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_BLK_SIZE); 5756e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_SCSI); 5766e790746SPaolo Bonzini 5776e790746SPaolo Bonzini if (s->blk.config_wce) { 5786e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_CONFIG_WCE); 5796e790746SPaolo Bonzini } 5806e790746SPaolo Bonzini if (bdrv_enable_write_cache(s->bs)) 5816e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_WCE); 5826e790746SPaolo Bonzini 5836e790746SPaolo Bonzini if (bdrv_is_read_only(s->bs)) 5846e790746SPaolo Bonzini features |= 1 << VIRTIO_BLK_F_RO; 5856e790746SPaolo Bonzini 5866e790746SPaolo Bonzini return features; 5876e790746SPaolo Bonzini } 5886e790746SPaolo Bonzini 5896e790746SPaolo Bonzini static void virtio_blk_set_status(VirtIODevice *vdev, uint8_t status) 5906e790746SPaolo Bonzini { 5916e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5926e790746SPaolo Bonzini uint32_t features; 5936e790746SPaolo Bonzini 5946e790746SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 5956e790746SPaolo Bonzini if (s->dataplane && !(status & (VIRTIO_CONFIG_S_DRIVER | 5966e790746SPaolo Bonzini VIRTIO_CONFIG_S_DRIVER_OK))) { 5976e790746SPaolo Bonzini virtio_blk_data_plane_stop(s->dataplane); 5986e790746SPaolo Bonzini } 5996e790746SPaolo Bonzini #endif 6006e790746SPaolo Bonzini 6016e790746SPaolo Bonzini if (!(status & VIRTIO_CONFIG_S_DRIVER_OK)) { 6026e790746SPaolo Bonzini return; 6036e790746SPaolo Bonzini } 6046e790746SPaolo Bonzini 6056e790746SPaolo Bonzini features = vdev->guest_features; 606ef5bc962SPaolo Bonzini 607ef5bc962SPaolo Bonzini /* A guest that supports VIRTIO_BLK_F_CONFIG_WCE must be able to send 608ef5bc962SPaolo Bonzini * cache flushes. Thus, the "auto writethrough" behavior is never 609ef5bc962SPaolo Bonzini * necessary for guests that support the VIRTIO_BLK_F_CONFIG_WCE feature. 610ef5bc962SPaolo Bonzini * Leaving it enabled would break the following sequence: 611ef5bc962SPaolo Bonzini * 612ef5bc962SPaolo Bonzini * Guest started with "-drive cache=writethrough" 613ef5bc962SPaolo Bonzini * Guest sets status to 0 614ef5bc962SPaolo Bonzini * Guest sets DRIVER bit in status field 615ef5bc962SPaolo Bonzini * Guest reads host features (WCE=0, CONFIG_WCE=1) 616ef5bc962SPaolo Bonzini * Guest writes guest features (WCE=0, CONFIG_WCE=1) 617ef5bc962SPaolo Bonzini * Guest writes 1 to the WCE configuration field (writeback mode) 618ef5bc962SPaolo Bonzini * Guest sets DRIVER_OK bit in status field 619ef5bc962SPaolo Bonzini * 620ef5bc962SPaolo Bonzini * s->bs would erroneously be placed in writethrough mode. 621ef5bc962SPaolo Bonzini */ 622ef5bc962SPaolo Bonzini if (!(features & (1 << VIRTIO_BLK_F_CONFIG_WCE))) { 6236d7e73d6SFam Zheng aio_context_acquire(bdrv_get_aio_context(s->bs)); 6246d7e73d6SFam Zheng bdrv_set_enable_write_cache(s->bs, 6256d7e73d6SFam Zheng !!(features & (1 << VIRTIO_BLK_F_WCE))); 6266d7e73d6SFam Zheng aio_context_release(bdrv_get_aio_context(s->bs)); 6276e790746SPaolo Bonzini } 628ef5bc962SPaolo Bonzini } 6296e790746SPaolo Bonzini 6306e790746SPaolo Bonzini static void virtio_blk_save(QEMUFile *f, void *opaque) 6316e790746SPaolo Bonzini { 632b2b295a7SGreg Kurz VirtIODevice *vdev = VIRTIO_DEVICE(opaque); 6336e790746SPaolo Bonzini 6346e790746SPaolo Bonzini virtio_save(vdev, f); 635b2b295a7SGreg Kurz } 636b2b295a7SGreg Kurz 637b2b295a7SGreg Kurz static void virtio_blk_save_device(VirtIODevice *vdev, QEMUFile *f) 638b2b295a7SGreg Kurz { 639b2b295a7SGreg Kurz VirtIOBlock *s = VIRTIO_BLK(vdev); 640b2b295a7SGreg Kurz VirtIOBlockReq *req = s->rq; 6416e790746SPaolo Bonzini 6426e790746SPaolo Bonzini while (req) { 6436e790746SPaolo Bonzini qemu_put_sbyte(f, 1); 644f897bf75SStefan Hajnoczi qemu_put_buffer(f, (unsigned char *)&req->elem, 645671ec3f0SFam Zheng sizeof(VirtQueueElement)); 6466e790746SPaolo Bonzini req = req->next; 6476e790746SPaolo Bonzini } 6486e790746SPaolo Bonzini qemu_put_sbyte(f, 0); 6496e790746SPaolo Bonzini } 6506e790746SPaolo Bonzini 6516e790746SPaolo Bonzini static int virtio_blk_load(QEMUFile *f, void *opaque, int version_id) 6526e790746SPaolo Bonzini { 6536e790746SPaolo Bonzini VirtIOBlock *s = opaque; 6546e790746SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(s); 6556e790746SPaolo Bonzini 6566e790746SPaolo Bonzini if (version_id != 2) 6576e790746SPaolo Bonzini return -EINVAL; 6586e790746SPaolo Bonzini 659b2b295a7SGreg Kurz return virtio_load(vdev, f, version_id); 6606e790746SPaolo Bonzini } 6616e790746SPaolo Bonzini 662b2b295a7SGreg Kurz static int virtio_blk_load_device(VirtIODevice *vdev, QEMUFile *f, 663b2b295a7SGreg Kurz int version_id) 664b2b295a7SGreg Kurz { 665b2b295a7SGreg Kurz VirtIOBlock *s = VIRTIO_BLK(vdev); 666b2b295a7SGreg Kurz 6676e790746SPaolo Bonzini while (qemu_get_sbyte(f)) { 6686e790746SPaolo Bonzini VirtIOBlockReq *req = virtio_blk_alloc_request(s); 669f897bf75SStefan Hajnoczi qemu_get_buffer(f, (unsigned char *)&req->elem, 670671ec3f0SFam Zheng sizeof(VirtQueueElement)); 6716e790746SPaolo Bonzini req->next = s->rq; 6726e790746SPaolo Bonzini s->rq = req; 6736e790746SPaolo Bonzini 674f897bf75SStefan Hajnoczi virtqueue_map_sg(req->elem.in_sg, req->elem.in_addr, 675f897bf75SStefan Hajnoczi req->elem.in_num, 1); 676f897bf75SStefan Hajnoczi virtqueue_map_sg(req->elem.out_sg, req->elem.out_addr, 677f897bf75SStefan Hajnoczi req->elem.out_num, 0); 6786e790746SPaolo Bonzini } 6796e790746SPaolo Bonzini 6806e790746SPaolo Bonzini return 0; 6816e790746SPaolo Bonzini } 6826e790746SPaolo Bonzini 6836e790746SPaolo Bonzini static void virtio_blk_resize(void *opaque) 6846e790746SPaolo Bonzini { 6856e790746SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(opaque); 6866e790746SPaolo Bonzini 6876e790746SPaolo Bonzini virtio_notify_config(vdev); 6886e790746SPaolo Bonzini } 6896e790746SPaolo Bonzini 6906e790746SPaolo Bonzini static const BlockDevOps virtio_block_ops = { 6916e790746SPaolo Bonzini .resize_cb = virtio_blk_resize, 6926e790746SPaolo Bonzini }; 6936e790746SPaolo Bonzini 69484db52d0SStefan Hajnoczi #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 69584db52d0SStefan Hajnoczi /* Disable dataplane thread during live migration since it does not 69684db52d0SStefan Hajnoczi * update the dirty memory bitmap yet. 69784db52d0SStefan Hajnoczi */ 69884db52d0SStefan Hajnoczi static void virtio_blk_migration_state_changed(Notifier *notifier, void *data) 69984db52d0SStefan Hajnoczi { 70084db52d0SStefan Hajnoczi VirtIOBlock *s = container_of(notifier, VirtIOBlock, 70184db52d0SStefan Hajnoczi migration_state_notifier); 70284db52d0SStefan Hajnoczi MigrationState *mig = data; 7033ffeeef7SAndreas Färber Error *err = NULL; 70484db52d0SStefan Hajnoczi 70584db52d0SStefan Hajnoczi if (migration_in_setup(mig)) { 70684db52d0SStefan Hajnoczi if (!s->dataplane) { 70784db52d0SStefan Hajnoczi return; 70884db52d0SStefan Hajnoczi } 70984db52d0SStefan Hajnoczi virtio_blk_data_plane_destroy(s->dataplane); 71084db52d0SStefan Hajnoczi s->dataplane = NULL; 71184db52d0SStefan Hajnoczi } else if (migration_has_finished(mig) || 71284db52d0SStefan Hajnoczi migration_has_failed(mig)) { 71384db52d0SStefan Hajnoczi if (s->dataplane) { 71484db52d0SStefan Hajnoczi return; 71584db52d0SStefan Hajnoczi } 71684db52d0SStefan Hajnoczi bdrv_drain_all(); /* complete in-flight non-dataplane requests */ 71784db52d0SStefan Hajnoczi virtio_blk_data_plane_create(VIRTIO_DEVICE(s), &s->blk, 7183ffeeef7SAndreas Färber &s->dataplane, &err); 7193ffeeef7SAndreas Färber if (err != NULL) { 7203ffeeef7SAndreas Färber error_report("%s", error_get_pretty(err)); 7213ffeeef7SAndreas Färber error_free(err); 7223ffeeef7SAndreas Färber } 72384db52d0SStefan Hajnoczi } 72484db52d0SStefan Hajnoczi } 72584db52d0SStefan Hajnoczi #endif /* CONFIG_VIRTIO_BLK_DATA_PLANE */ 72684db52d0SStefan Hajnoczi 72775884afdSAndreas Färber static void virtio_blk_device_realize(DeviceState *dev, Error **errp) 7286e790746SPaolo Bonzini { 72975884afdSAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 730179b417eSAndreas Färber VirtIOBlock *s = VIRTIO_BLK(dev); 7316e790746SPaolo Bonzini VirtIOBlkConf *blk = &(s->blk); 7323ffeeef7SAndreas Färber #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 7333ffeeef7SAndreas Färber Error *err = NULL; 7343ffeeef7SAndreas Färber #endif 7356e790746SPaolo Bonzini static int virtio_blk_id; 7366e790746SPaolo Bonzini 7376e790746SPaolo Bonzini if (!blk->conf.bs) { 73875884afdSAndreas Färber error_setg(errp, "drive property not set"); 73975884afdSAndreas Färber return; 7406e790746SPaolo Bonzini } 7416e790746SPaolo Bonzini if (!bdrv_is_inserted(blk->conf.bs)) { 74275884afdSAndreas Färber error_setg(errp, "Device needs media, but drive is empty"); 74375884afdSAndreas Färber return; 7446e790746SPaolo Bonzini } 7456e790746SPaolo Bonzini 7466e790746SPaolo Bonzini blkconf_serial(&blk->conf, &blk->serial); 747ef5bc962SPaolo Bonzini s->original_wce = bdrv_enable_write_cache(blk->conf.bs); 7486e790746SPaolo Bonzini if (blkconf_geometry(&blk->conf, NULL, 65535, 255, 255) < 0) { 74975884afdSAndreas Färber error_setg(errp, "Error setting geometry"); 75075884afdSAndreas Färber return; 7516e790746SPaolo Bonzini } 7526e790746SPaolo Bonzini 7536e790746SPaolo Bonzini virtio_init(vdev, "virtio-blk", VIRTIO_ID_BLOCK, 7546e790746SPaolo Bonzini sizeof(struct virtio_blk_config)); 7556e790746SPaolo Bonzini 7566e790746SPaolo Bonzini s->bs = blk->conf.bs; 7576e790746SPaolo Bonzini s->conf = &blk->conf; 7586e790746SPaolo Bonzini s->rq = NULL; 7596e790746SPaolo Bonzini s->sector_mask = (s->conf->logical_block_size / BDRV_SECTOR_SIZE) - 1; 7606e790746SPaolo Bonzini 7616e790746SPaolo Bonzini s->vq = virtio_add_queue(vdev, 128, virtio_blk_handle_output); 762bf4bd461SFam Zheng s->complete_request = virtio_blk_complete_request; 7636e790746SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 7643ffeeef7SAndreas Färber virtio_blk_data_plane_create(vdev, blk, &s->dataplane, &err); 7653ffeeef7SAndreas Färber if (err != NULL) { 76675884afdSAndreas Färber error_propagate(errp, err); 7676a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 76875884afdSAndreas Färber return; 7696e790746SPaolo Bonzini } 77084db52d0SStefan Hajnoczi s->migration_state_notifier.notify = virtio_blk_migration_state_changed; 77184db52d0SStefan Hajnoczi add_migration_state_change_notifier(&s->migration_state_notifier); 7726e790746SPaolo Bonzini #endif 7736e790746SPaolo Bonzini 7746e790746SPaolo Bonzini s->change = qemu_add_vm_change_state_handler(virtio_blk_dma_restart_cb, s); 775179b417eSAndreas Färber register_savevm(dev, "virtio-blk", virtio_blk_id++, 2, 7766e790746SPaolo Bonzini virtio_blk_save, virtio_blk_load, s); 7776e790746SPaolo Bonzini bdrv_set_dev_ops(s->bs, &virtio_block_ops, s); 7781b7fd729SPaolo Bonzini bdrv_set_guest_block_size(s->bs, s->conf->logical_block_size); 7796e790746SPaolo Bonzini 7806e790746SPaolo Bonzini bdrv_iostatus_enable(s->bs); 7816e790746SPaolo Bonzini 782179b417eSAndreas Färber add_boot_device_path(s->conf->bootindex, dev, "/disk@0,0"); 7836e790746SPaolo Bonzini } 7846e790746SPaolo Bonzini 785306ec6c3SAndreas Färber static void virtio_blk_device_unrealize(DeviceState *dev, Error **errp) 7866e790746SPaolo Bonzini { 787306ec6c3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 788306ec6c3SAndreas Färber VirtIOBlock *s = VIRTIO_BLK(dev); 789306ec6c3SAndreas Färber 7906e790746SPaolo Bonzini #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 79184db52d0SStefan Hajnoczi remove_migration_state_change_notifier(&s->migration_state_notifier); 7926e790746SPaolo Bonzini virtio_blk_data_plane_destroy(s->dataplane); 7936e790746SPaolo Bonzini s->dataplane = NULL; 7946e790746SPaolo Bonzini #endif 7956e790746SPaolo Bonzini qemu_del_vm_change_state_handler(s->change); 796306ec6c3SAndreas Färber unregister_savevm(dev, "virtio-blk", s); 7976e790746SPaolo Bonzini blockdev_mark_auto_del(s->bs); 7986a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 7996e790746SPaolo Bonzini } 8006e790746SPaolo Bonzini 801467b3f33SStefan Hajnoczi static void virtio_blk_instance_init(Object *obj) 802467b3f33SStefan Hajnoczi { 803467b3f33SStefan Hajnoczi VirtIOBlock *s = VIRTIO_BLK(obj); 804467b3f33SStefan Hajnoczi 805467b3f33SStefan Hajnoczi object_property_add_link(obj, "iothread", TYPE_IOTHREAD, 806467b3f33SStefan Hajnoczi (Object **)&s->blk.iothread, 807467b3f33SStefan Hajnoczi qdev_prop_allow_set_link_before_realize, 808467b3f33SStefan Hajnoczi OBJ_PROP_LINK_UNREF_ON_RELEASE, NULL); 809467b3f33SStefan Hajnoczi } 810467b3f33SStefan Hajnoczi 8116e790746SPaolo Bonzini static Property virtio_blk_properties[] = { 81232a877e4SStefan Hajnoczi DEFINE_BLOCK_PROPERTIES(VirtIOBlock, blk.conf), 81332a877e4SStefan Hajnoczi DEFINE_BLOCK_CHS_PROPERTIES(VirtIOBlock, blk.conf), 81432a877e4SStefan Hajnoczi DEFINE_PROP_STRING("serial", VirtIOBlock, blk.serial), 81532a877e4SStefan Hajnoczi DEFINE_PROP_BIT("config-wce", VirtIOBlock, blk.config_wce, 0, true), 81632a877e4SStefan Hajnoczi #ifdef __linux__ 81732a877e4SStefan Hajnoczi DEFINE_PROP_BIT("scsi", VirtIOBlock, blk.scsi, 0, true), 81832a877e4SStefan Hajnoczi #endif 81932a877e4SStefan Hajnoczi #ifdef CONFIG_VIRTIO_BLK_DATA_PLANE 82032a877e4SStefan Hajnoczi DEFINE_PROP_BIT("x-data-plane", VirtIOBlock, blk.data_plane, 0, false), 82132a877e4SStefan Hajnoczi #endif 8226e790746SPaolo Bonzini DEFINE_PROP_END_OF_LIST(), 8236e790746SPaolo Bonzini }; 8246e790746SPaolo Bonzini 8256e790746SPaolo Bonzini static void virtio_blk_class_init(ObjectClass *klass, void *data) 8266e790746SPaolo Bonzini { 8276e790746SPaolo Bonzini DeviceClass *dc = DEVICE_CLASS(klass); 8286e790746SPaolo Bonzini VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass); 82975884afdSAndreas Färber 8306e790746SPaolo Bonzini dc->props = virtio_blk_properties; 831125ee0edSMarcel Apfelbaum set_bit(DEVICE_CATEGORY_STORAGE, dc->categories); 83275884afdSAndreas Färber vdc->realize = virtio_blk_device_realize; 833306ec6c3SAndreas Färber vdc->unrealize = virtio_blk_device_unrealize; 8346e790746SPaolo Bonzini vdc->get_config = virtio_blk_update_config; 8356e790746SPaolo Bonzini vdc->set_config = virtio_blk_set_config; 8366e790746SPaolo Bonzini vdc->get_features = virtio_blk_get_features; 8376e790746SPaolo Bonzini vdc->set_status = virtio_blk_set_status; 8386e790746SPaolo Bonzini vdc->reset = virtio_blk_reset; 839b2b295a7SGreg Kurz vdc->save = virtio_blk_save_device; 840b2b295a7SGreg Kurz vdc->load = virtio_blk_load_device; 8416e790746SPaolo Bonzini } 8426e790746SPaolo Bonzini 8436e790746SPaolo Bonzini static const TypeInfo virtio_device_info = { 8446e790746SPaolo Bonzini .name = TYPE_VIRTIO_BLK, 8456e790746SPaolo Bonzini .parent = TYPE_VIRTIO_DEVICE, 8466e790746SPaolo Bonzini .instance_size = sizeof(VirtIOBlock), 847467b3f33SStefan Hajnoczi .instance_init = virtio_blk_instance_init, 8486e790746SPaolo Bonzini .class_init = virtio_blk_class_init, 8496e790746SPaolo Bonzini }; 8506e790746SPaolo Bonzini 8516e790746SPaolo Bonzini static void virtio_register_types(void) 8526e790746SPaolo Bonzini { 8536e790746SPaolo Bonzini type_register_static(&virtio_device_info); 8546e790746SPaolo Bonzini } 8556e790746SPaolo Bonzini 8566e790746SPaolo Bonzini type_init(virtio_register_types) 857