16e790746SPaolo Bonzini /* 26e790746SPaolo Bonzini * Virtio Block Device 36e790746SPaolo Bonzini * 46e790746SPaolo Bonzini * Copyright IBM, Corp. 2007 56e790746SPaolo Bonzini * 66e790746SPaolo Bonzini * Authors: 76e790746SPaolo Bonzini * Anthony Liguori <aliguori@us.ibm.com> 86e790746SPaolo Bonzini * 96e790746SPaolo Bonzini * This work is licensed under the terms of the GNU GPL, version 2. See 106e790746SPaolo Bonzini * the COPYING file in the top-level directory. 116e790746SPaolo Bonzini * 126e790746SPaolo Bonzini */ 136e790746SPaolo Bonzini 146e790746SPaolo Bonzini #include "qemu-common.h" 15827805a2SFam Zheng #include "qemu/iov.h" 166e790746SPaolo Bonzini #include "qemu/error-report.h" 176e790746SPaolo Bonzini #include "trace.h" 186e790746SPaolo Bonzini #include "hw/block/block.h" 196e790746SPaolo Bonzini #include "sysemu/blockdev.h" 206e790746SPaolo Bonzini #include "hw/virtio/virtio-blk.h" 216e790746SPaolo Bonzini #include "dataplane/virtio-blk.h" 2284db52d0SStefan Hajnoczi #include "migration/migration.h" 236e790746SPaolo Bonzini #include "block/scsi.h" 246e790746SPaolo Bonzini #ifdef __linux__ 256e790746SPaolo Bonzini # include <scsi/sg.h> 266e790746SPaolo Bonzini #endif 276e790746SPaolo Bonzini #include "hw/virtio/virtio-bus.h" 28783d1897SRusty Russell #include "hw/virtio/virtio-access.h" 296e790746SPaolo Bonzini 30f897bf75SStefan Hajnoczi VirtIOBlockReq *virtio_blk_alloc_request(VirtIOBlock *s) 31671ec3f0SFam Zheng { 32869d66afSStefan Hajnoczi VirtIOBlockReq *req = g_slice_new(VirtIOBlockReq); 33671ec3f0SFam Zheng req->dev = s; 34869d66afSStefan Hajnoczi req->qiov.size = 0; 35869d66afSStefan Hajnoczi req->next = NULL; 36671ec3f0SFam Zheng return req; 37671ec3f0SFam Zheng } 38671ec3f0SFam Zheng 39f897bf75SStefan Hajnoczi void virtio_blk_free_request(VirtIOBlockReq *req) 40671ec3f0SFam Zheng { 41671ec3f0SFam Zheng if (req) { 42671ec3f0SFam Zheng g_slice_free(VirtIOBlockReq, req); 43671ec3f0SFam Zheng } 44671ec3f0SFam Zheng } 45671ec3f0SFam Zheng 46bf4bd461SFam Zheng static void virtio_blk_complete_request(VirtIOBlockReq *req, 47bf4bd461SFam Zheng unsigned char status) 486e790746SPaolo Bonzini { 496e790746SPaolo Bonzini VirtIOBlock *s = req->dev; 506e790746SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(s); 516e790746SPaolo Bonzini 526e790746SPaolo Bonzini trace_virtio_blk_req_complete(req, status); 536e790746SPaolo Bonzini 546e790746SPaolo Bonzini stb_p(&req->in->status, status); 55f897bf75SStefan Hajnoczi virtqueue_push(s->vq, &req->elem, req->qiov.size + sizeof(*req->in)); 566e790746SPaolo Bonzini virtio_notify(vdev, s->vq); 576e790746SPaolo Bonzini } 586e790746SPaolo Bonzini 59bf4bd461SFam Zheng static void virtio_blk_req_complete(VirtIOBlockReq *req, unsigned char status) 60bf4bd461SFam Zheng { 61bf4bd461SFam Zheng req->dev->complete_request(req, status); 62bf4bd461SFam Zheng } 63bf4bd461SFam Zheng 646e790746SPaolo Bonzini static int virtio_blk_handle_rw_error(VirtIOBlockReq *req, int error, 656e790746SPaolo Bonzini bool is_read) 666e790746SPaolo Bonzini { 676e790746SPaolo Bonzini BlockErrorAction action = bdrv_get_error_action(req->dev->bs, is_read, error); 686e790746SPaolo Bonzini VirtIOBlock *s = req->dev; 696e790746SPaolo Bonzini 70a589569fSWenchao Xia if (action == BLOCK_ERROR_ACTION_STOP) { 716e790746SPaolo Bonzini req->next = s->rq; 726e790746SPaolo Bonzini s->rq = req; 73a589569fSWenchao Xia } else if (action == BLOCK_ERROR_ACTION_REPORT) { 746e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); 755366d0c8SBenoît Canet block_acct_done(bdrv_get_stats(s->bs), &req->acct); 76671ec3f0SFam Zheng virtio_blk_free_request(req); 776e790746SPaolo Bonzini } 786e790746SPaolo Bonzini 796e790746SPaolo Bonzini bdrv_error_action(s->bs, action, is_read, error); 80a589569fSWenchao Xia return action != BLOCK_ERROR_ACTION_IGNORE; 816e790746SPaolo Bonzini } 826e790746SPaolo Bonzini 836e790746SPaolo Bonzini static void virtio_blk_rw_complete(void *opaque, int ret) 846e790746SPaolo Bonzini { 856e790746SPaolo Bonzini VirtIOBlockReq *req = opaque; 866e790746SPaolo Bonzini 876e790746SPaolo Bonzini trace_virtio_blk_rw_complete(req, ret); 886e790746SPaolo Bonzini 896e790746SPaolo Bonzini if (ret) { 90783d1897SRusty Russell int p = virtio_ldl_p(VIRTIO_DEVICE(req->dev), &req->out.type); 91783d1897SRusty Russell bool is_read = !(p & VIRTIO_BLK_T_OUT); 926e790746SPaolo Bonzini if (virtio_blk_handle_rw_error(req, -ret, is_read)) 936e790746SPaolo Bonzini return; 946e790746SPaolo Bonzini } 956e790746SPaolo Bonzini 966e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 975366d0c8SBenoît Canet block_acct_done(bdrv_get_stats(req->dev->bs), &req->acct); 98671ec3f0SFam Zheng virtio_blk_free_request(req); 996e790746SPaolo Bonzini } 1006e790746SPaolo Bonzini 1016e790746SPaolo Bonzini static void virtio_blk_flush_complete(void *opaque, int ret) 1026e790746SPaolo Bonzini { 1036e790746SPaolo Bonzini VirtIOBlockReq *req = opaque; 1046e790746SPaolo Bonzini 1056e790746SPaolo Bonzini if (ret) { 1066e790746SPaolo Bonzini if (virtio_blk_handle_rw_error(req, -ret, 0)) { 1076e790746SPaolo Bonzini return; 1086e790746SPaolo Bonzini } 1096e790746SPaolo Bonzini } 1106e790746SPaolo Bonzini 1116e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 1125366d0c8SBenoît Canet block_acct_done(bdrv_get_stats(req->dev->bs), &req->acct); 113671ec3f0SFam Zheng virtio_blk_free_request(req); 1146e790746SPaolo Bonzini } 1156e790746SPaolo Bonzini 1166e790746SPaolo Bonzini static VirtIOBlockReq *virtio_blk_get_request(VirtIOBlock *s) 1176e790746SPaolo Bonzini { 1186e790746SPaolo Bonzini VirtIOBlockReq *req = virtio_blk_alloc_request(s); 1196e790746SPaolo Bonzini 120f897bf75SStefan Hajnoczi if (!virtqueue_pop(s->vq, &req->elem)) { 121671ec3f0SFam Zheng virtio_blk_free_request(req); 1226e790746SPaolo Bonzini return NULL; 1236e790746SPaolo Bonzini } 1246e790746SPaolo Bonzini 1256e790746SPaolo Bonzini return req; 1266e790746SPaolo Bonzini } 1276e790746SPaolo Bonzini 1285a05cbeeSFam Zheng int virtio_blk_handle_scsi_req(VirtIOBlock *blk, 1295a05cbeeSFam Zheng VirtQueueElement *elem) 1306e790746SPaolo Bonzini { 1316e790746SPaolo Bonzini int status = VIRTIO_BLK_S_OK; 1325a05cbeeSFam Zheng struct virtio_scsi_inhdr *scsi = NULL; 133783d1897SRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(blk); 134783d1897SRusty Russell 1355a05cbeeSFam Zheng #ifdef __linux__ 1365a05cbeeSFam Zheng int i; 1375a05cbeeSFam Zheng struct sg_io_hdr hdr; 1385a05cbeeSFam Zheng #endif 1396e790746SPaolo Bonzini 1406e790746SPaolo Bonzini /* 1416e790746SPaolo Bonzini * We require at least one output segment each for the virtio_blk_outhdr 1426e790746SPaolo Bonzini * and the SCSI command block. 1436e790746SPaolo Bonzini * 1446e790746SPaolo Bonzini * We also at least require the virtio_blk_inhdr, the virtio_scsi_inhdr 1456e790746SPaolo Bonzini * and the sense buffer pointer in the input segments. 1466e790746SPaolo Bonzini */ 1475a05cbeeSFam Zheng if (elem->out_num < 2 || elem->in_num < 3) { 1485a05cbeeSFam Zheng status = VIRTIO_BLK_S_IOERR; 1495a05cbeeSFam Zheng goto fail; 1506e790746SPaolo Bonzini } 1516e790746SPaolo Bonzini 1526e790746SPaolo Bonzini /* 1536e790746SPaolo Bonzini * The scsi inhdr is placed in the second-to-last input segment, just 1546e790746SPaolo Bonzini * before the regular inhdr. 1556e790746SPaolo Bonzini */ 1565a05cbeeSFam Zheng scsi = (void *)elem->in_sg[elem->in_num - 2].iov_base; 1576e790746SPaolo Bonzini 1585a05cbeeSFam Zheng if (!blk->blk.scsi) { 1596e790746SPaolo Bonzini status = VIRTIO_BLK_S_UNSUPP; 1606e790746SPaolo Bonzini goto fail; 1616e790746SPaolo Bonzini } 1626e790746SPaolo Bonzini 1636e790746SPaolo Bonzini /* 1646e790746SPaolo Bonzini * No support for bidirection commands yet. 1656e790746SPaolo Bonzini */ 1665a05cbeeSFam Zheng if (elem->out_num > 2 && elem->in_num > 3) { 1676e790746SPaolo Bonzini status = VIRTIO_BLK_S_UNSUPP; 1686e790746SPaolo Bonzini goto fail; 1696e790746SPaolo Bonzini } 1706e790746SPaolo Bonzini 1716e790746SPaolo Bonzini #ifdef __linux__ 1726e790746SPaolo Bonzini memset(&hdr, 0, sizeof(struct sg_io_hdr)); 1736e790746SPaolo Bonzini hdr.interface_id = 'S'; 1745a05cbeeSFam Zheng hdr.cmd_len = elem->out_sg[1].iov_len; 1755a05cbeeSFam Zheng hdr.cmdp = elem->out_sg[1].iov_base; 1766e790746SPaolo Bonzini hdr.dxfer_len = 0; 1776e790746SPaolo Bonzini 1785a05cbeeSFam Zheng if (elem->out_num > 2) { 1796e790746SPaolo Bonzini /* 1806e790746SPaolo Bonzini * If there are more than the minimally required 2 output segments 1816e790746SPaolo Bonzini * there is write payload starting from the third iovec. 1826e790746SPaolo Bonzini */ 1836e790746SPaolo Bonzini hdr.dxfer_direction = SG_DXFER_TO_DEV; 1845a05cbeeSFam Zheng hdr.iovec_count = elem->out_num - 2; 1856e790746SPaolo Bonzini 1866e790746SPaolo Bonzini for (i = 0; i < hdr.iovec_count; i++) 1875a05cbeeSFam Zheng hdr.dxfer_len += elem->out_sg[i + 2].iov_len; 1886e790746SPaolo Bonzini 1895a05cbeeSFam Zheng hdr.dxferp = elem->out_sg + 2; 1906e790746SPaolo Bonzini 1915a05cbeeSFam Zheng } else if (elem->in_num > 3) { 1926e790746SPaolo Bonzini /* 1936e790746SPaolo Bonzini * If we have more than 3 input segments the guest wants to actually 1946e790746SPaolo Bonzini * read data. 1956e790746SPaolo Bonzini */ 1966e790746SPaolo Bonzini hdr.dxfer_direction = SG_DXFER_FROM_DEV; 1975a05cbeeSFam Zheng hdr.iovec_count = elem->in_num - 3; 1986e790746SPaolo Bonzini for (i = 0; i < hdr.iovec_count; i++) 1995a05cbeeSFam Zheng hdr.dxfer_len += elem->in_sg[i].iov_len; 2006e790746SPaolo Bonzini 2015a05cbeeSFam Zheng hdr.dxferp = elem->in_sg; 2026e790746SPaolo Bonzini } else { 2036e790746SPaolo Bonzini /* 2046e790746SPaolo Bonzini * Some SCSI commands don't actually transfer any data. 2056e790746SPaolo Bonzini */ 2066e790746SPaolo Bonzini hdr.dxfer_direction = SG_DXFER_NONE; 2076e790746SPaolo Bonzini } 2086e790746SPaolo Bonzini 2095a05cbeeSFam Zheng hdr.sbp = elem->in_sg[elem->in_num - 3].iov_base; 2105a05cbeeSFam Zheng hdr.mx_sb_len = elem->in_sg[elem->in_num - 3].iov_len; 2116e790746SPaolo Bonzini 2125a05cbeeSFam Zheng status = bdrv_ioctl(blk->bs, SG_IO, &hdr); 2135a05cbeeSFam Zheng if (status) { 2146e790746SPaolo Bonzini status = VIRTIO_BLK_S_UNSUPP; 2156e790746SPaolo Bonzini goto fail; 2166e790746SPaolo Bonzini } 2176e790746SPaolo Bonzini 2186e790746SPaolo Bonzini /* 2196e790746SPaolo Bonzini * From SCSI-Generic-HOWTO: "Some lower level drivers (e.g. ide-scsi) 2206e790746SPaolo Bonzini * clear the masked_status field [hence status gets cleared too, see 2216e790746SPaolo Bonzini * block/scsi_ioctl.c] even when a CHECK_CONDITION or COMMAND_TERMINATED 2226e790746SPaolo Bonzini * status has occurred. However they do set DRIVER_SENSE in driver_status 2236e790746SPaolo Bonzini * field. Also a (sb_len_wr > 0) indicates there is a sense buffer. 2246e790746SPaolo Bonzini */ 2256e790746SPaolo Bonzini if (hdr.status == 0 && hdr.sb_len_wr > 0) { 2266e790746SPaolo Bonzini hdr.status = CHECK_CONDITION; 2276e790746SPaolo Bonzini } 2286e790746SPaolo Bonzini 229783d1897SRusty Russell virtio_stl_p(vdev, &scsi->errors, 2306e790746SPaolo Bonzini hdr.status | (hdr.msg_status << 8) | 2316e790746SPaolo Bonzini (hdr.host_status << 16) | (hdr.driver_status << 24)); 232783d1897SRusty Russell virtio_stl_p(vdev, &scsi->residual, hdr.resid); 233783d1897SRusty Russell virtio_stl_p(vdev, &scsi->sense_len, hdr.sb_len_wr); 234783d1897SRusty Russell virtio_stl_p(vdev, &scsi->data_len, hdr.dxfer_len); 2356e790746SPaolo Bonzini 2365a05cbeeSFam Zheng return status; 2376e790746SPaolo Bonzini #else 2386e790746SPaolo Bonzini abort(); 2396e790746SPaolo Bonzini #endif 2406e790746SPaolo Bonzini 2416e790746SPaolo Bonzini fail: 2426e790746SPaolo Bonzini /* Just put anything nonzero so that the ioctl fails in the guest. */ 2435a05cbeeSFam Zheng if (scsi) { 244783d1897SRusty Russell virtio_stl_p(vdev, &scsi->errors, 255); 2455a05cbeeSFam Zheng } 2465a05cbeeSFam Zheng return status; 2475a05cbeeSFam Zheng } 2485a05cbeeSFam Zheng 2495a05cbeeSFam Zheng static void virtio_blk_handle_scsi(VirtIOBlockReq *req) 2505a05cbeeSFam Zheng { 2515a05cbeeSFam Zheng int status; 2525a05cbeeSFam Zheng 253f897bf75SStefan Hajnoczi status = virtio_blk_handle_scsi_req(req->dev, &req->elem); 2546e790746SPaolo Bonzini virtio_blk_req_complete(req, status); 255671ec3f0SFam Zheng virtio_blk_free_request(req); 2566e790746SPaolo Bonzini } 2576e790746SPaolo Bonzini 258fee65db7SFam Zheng void virtio_submit_multiwrite(BlockDriverState *bs, MultiReqBuffer *mrb) 2596e790746SPaolo Bonzini { 2606e790746SPaolo Bonzini int i, ret; 2616e790746SPaolo Bonzini 2626e790746SPaolo Bonzini if (!mrb->num_writes) { 2636e790746SPaolo Bonzini return; 2646e790746SPaolo Bonzini } 2656e790746SPaolo Bonzini 2666e790746SPaolo Bonzini ret = bdrv_aio_multiwrite(bs, mrb->blkreq, mrb->num_writes); 2676e790746SPaolo Bonzini if (ret != 0) { 2686e790746SPaolo Bonzini for (i = 0; i < mrb->num_writes; i++) { 2696e790746SPaolo Bonzini if (mrb->blkreq[i].error) { 2706e790746SPaolo Bonzini virtio_blk_rw_complete(mrb->blkreq[i].opaque, -EIO); 2716e790746SPaolo Bonzini } 2726e790746SPaolo Bonzini } 2736e790746SPaolo Bonzini } 2746e790746SPaolo Bonzini 2756e790746SPaolo Bonzini mrb->num_writes = 0; 2766e790746SPaolo Bonzini } 2776e790746SPaolo Bonzini 2786e790746SPaolo Bonzini static void virtio_blk_handle_flush(VirtIOBlockReq *req, MultiReqBuffer *mrb) 2796e790746SPaolo Bonzini { 2805366d0c8SBenoît Canet block_acct_start(bdrv_get_stats(req->dev->bs), &req->acct, 0, 2815366d0c8SBenoît Canet BLOCK_ACCT_FLUSH); 2826e790746SPaolo Bonzini 2836e790746SPaolo Bonzini /* 2846e790746SPaolo Bonzini * Make sure all outstanding writes are posted to the backing device. 2856e790746SPaolo Bonzini */ 2866e790746SPaolo Bonzini virtio_submit_multiwrite(req->dev->bs, mrb); 2876e790746SPaolo Bonzini bdrv_aio_flush(req->dev->bs, virtio_blk_flush_complete, req); 2886e790746SPaolo Bonzini } 2896e790746SPaolo Bonzini 290d0e14376SMarkus Armbruster static bool virtio_blk_sect_range_ok(VirtIOBlock *dev, 291d0e14376SMarkus Armbruster uint64_t sector, size_t size) 292d0e14376SMarkus Armbruster { 2933c2daac0SMarkus Armbruster uint64_t nb_sectors = size >> BDRV_SECTOR_BITS; 2943c2daac0SMarkus Armbruster uint64_t total_sectors; 2953c2daac0SMarkus Armbruster 296d0e14376SMarkus Armbruster if (sector & dev->sector_mask) { 297d0e14376SMarkus Armbruster return false; 298d0e14376SMarkus Armbruster } 299d0e14376SMarkus Armbruster if (size % dev->conf->logical_block_size) { 300d0e14376SMarkus Armbruster return false; 301d0e14376SMarkus Armbruster } 3023c2daac0SMarkus Armbruster bdrv_get_geometry(dev->bs, &total_sectors); 3033c2daac0SMarkus Armbruster if (sector > total_sectors || nb_sectors > total_sectors - sector) { 3043c2daac0SMarkus Armbruster return false; 3053c2daac0SMarkus Armbruster } 306d0e14376SMarkus Armbruster return true; 307d0e14376SMarkus Armbruster } 308d0e14376SMarkus Armbruster 3096e790746SPaolo Bonzini static void virtio_blk_handle_write(VirtIOBlockReq *req, MultiReqBuffer *mrb) 3106e790746SPaolo Bonzini { 3116e790746SPaolo Bonzini BlockRequest *blkreq; 3126e790746SPaolo Bonzini uint64_t sector; 3136e790746SPaolo Bonzini 314783d1897SRusty Russell sector = virtio_ldq_p(VIRTIO_DEVICE(req->dev), &req->out.sector); 3156e790746SPaolo Bonzini 3166e790746SPaolo Bonzini trace_virtio_blk_handle_write(req, sector, req->qiov.size / 512); 3176e790746SPaolo Bonzini 318d0e14376SMarkus Armbruster if (!virtio_blk_sect_range_ok(req->dev, sector, req->qiov.size)) { 31942e38c1fSMarkus Armbruster virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); 32042e38c1fSMarkus Armbruster virtio_blk_free_request(req); 3216e790746SPaolo Bonzini return; 3226e790746SPaolo Bonzini } 3236e790746SPaolo Bonzini 3245366d0c8SBenoît Canet block_acct_start(bdrv_get_stats(req->dev->bs), &req->acct, req->qiov.size, 3255366d0c8SBenoît Canet BLOCK_ACCT_WRITE); 32642e38c1fSMarkus Armbruster 3276e790746SPaolo Bonzini if (mrb->num_writes == 32) { 3286e790746SPaolo Bonzini virtio_submit_multiwrite(req->dev->bs, mrb); 3296e790746SPaolo Bonzini } 3306e790746SPaolo Bonzini 3316e790746SPaolo Bonzini blkreq = &mrb->blkreq[mrb->num_writes]; 3326e790746SPaolo Bonzini blkreq->sector = sector; 3336e790746SPaolo Bonzini blkreq->nb_sectors = req->qiov.size / BDRV_SECTOR_SIZE; 3346e790746SPaolo Bonzini blkreq->qiov = &req->qiov; 3356e790746SPaolo Bonzini blkreq->cb = virtio_blk_rw_complete; 3366e790746SPaolo Bonzini blkreq->opaque = req; 3376e790746SPaolo Bonzini blkreq->error = 0; 3386e790746SPaolo Bonzini 3396e790746SPaolo Bonzini mrb->num_writes++; 3406e790746SPaolo Bonzini } 3416e790746SPaolo Bonzini 3426e790746SPaolo Bonzini static void virtio_blk_handle_read(VirtIOBlockReq *req) 3436e790746SPaolo Bonzini { 3446e790746SPaolo Bonzini uint64_t sector; 3456e790746SPaolo Bonzini 346783d1897SRusty Russell sector = virtio_ldq_p(VIRTIO_DEVICE(req->dev), &req->out.sector); 3476e790746SPaolo Bonzini 3486e790746SPaolo Bonzini trace_virtio_blk_handle_read(req, sector, req->qiov.size / 512); 3496e790746SPaolo Bonzini 350d0e14376SMarkus Armbruster if (!virtio_blk_sect_range_ok(req->dev, sector, req->qiov.size)) { 35142e38c1fSMarkus Armbruster virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); 35242e38c1fSMarkus Armbruster virtio_blk_free_request(req); 3536e790746SPaolo Bonzini return; 3546e790746SPaolo Bonzini } 35542e38c1fSMarkus Armbruster 3565366d0c8SBenoît Canet block_acct_start(bdrv_get_stats(req->dev->bs), &req->acct, req->qiov.size, 3575366d0c8SBenoît Canet BLOCK_ACCT_READ); 3586e790746SPaolo Bonzini bdrv_aio_readv(req->dev->bs, sector, &req->qiov, 3596e790746SPaolo Bonzini req->qiov.size / BDRV_SECTOR_SIZE, 3606e790746SPaolo Bonzini virtio_blk_rw_complete, req); 3616e790746SPaolo Bonzini } 3626e790746SPaolo Bonzini 363fee65db7SFam Zheng void virtio_blk_handle_request(VirtIOBlockReq *req, MultiReqBuffer *mrb) 3646e790746SPaolo Bonzini { 3656e790746SPaolo Bonzini uint32_t type; 366f897bf75SStefan Hajnoczi struct iovec *in_iov = req->elem.in_sg; 367f897bf75SStefan Hajnoczi struct iovec *iov = req->elem.out_sg; 368f897bf75SStefan Hajnoczi unsigned in_num = req->elem.in_num; 369f897bf75SStefan Hajnoczi unsigned out_num = req->elem.out_num; 3706e790746SPaolo Bonzini 371f897bf75SStefan Hajnoczi if (req->elem.out_num < 1 || req->elem.in_num < 1) { 3726e790746SPaolo Bonzini error_report("virtio-blk missing headers"); 3736e790746SPaolo Bonzini exit(1); 3746e790746SPaolo Bonzini } 3756e790746SPaolo Bonzini 376827805a2SFam Zheng if (unlikely(iov_to_buf(iov, out_num, 0, &req->out, 377827805a2SFam Zheng sizeof(req->out)) != sizeof(req->out))) { 378827805a2SFam Zheng error_report("virtio-blk request outhdr too short"); 379827805a2SFam Zheng exit(1); 380827805a2SFam Zheng } 381ee17e848SFam Zheng 382827805a2SFam Zheng iov_discard_front(&iov, &out_num, sizeof(req->out)); 383ee17e848SFam Zheng 384ee17e848SFam Zheng if (in_num < 1 || 385ee17e848SFam Zheng in_iov[in_num - 1].iov_len < sizeof(struct virtio_blk_inhdr)) { 386ee17e848SFam Zheng error_report("virtio-blk request inhdr too short"); 387ee17e848SFam Zheng exit(1); 388ee17e848SFam Zheng } 389ee17e848SFam Zheng 390ee17e848SFam Zheng req->in = (void *)in_iov[in_num - 1].iov_base 391ee17e848SFam Zheng + in_iov[in_num - 1].iov_len 392ee17e848SFam Zheng - sizeof(struct virtio_blk_inhdr); 393ee17e848SFam Zheng iov_discard_back(in_iov, &in_num, sizeof(struct virtio_blk_inhdr)); 3946e790746SPaolo Bonzini 395783d1897SRusty Russell type = virtio_ldl_p(VIRTIO_DEVICE(req->dev), &req->out.type); 3966e790746SPaolo Bonzini 3976e790746SPaolo Bonzini if (type & VIRTIO_BLK_T_FLUSH) { 3986e790746SPaolo Bonzini virtio_blk_handle_flush(req, mrb); 3996e790746SPaolo Bonzini } else if (type & VIRTIO_BLK_T_SCSI_CMD) { 4006e790746SPaolo Bonzini virtio_blk_handle_scsi(req); 4016e790746SPaolo Bonzini } else if (type & VIRTIO_BLK_T_GET_ID) { 4026e790746SPaolo Bonzini VirtIOBlock *s = req->dev; 4036e790746SPaolo Bonzini 4046e790746SPaolo Bonzini /* 4056e790746SPaolo Bonzini * NB: per existing s/n string convention the string is 4066e790746SPaolo Bonzini * terminated by '\0' only when shorter than buffer. 4076e790746SPaolo Bonzini */ 408a83ceea8SMarc Marí const char *serial = s->blk.serial ? s->blk.serial : ""; 409a83ceea8SMarc Marí size_t size = MIN(strlen(serial) + 1, 410a83ceea8SMarc Marí MIN(iov_size(in_iov, in_num), 411a83ceea8SMarc Marí VIRTIO_BLK_ID_BYTES)); 412a83ceea8SMarc Marí iov_from_buf(in_iov, in_num, 0, serial, size); 4136e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 414671ec3f0SFam Zheng virtio_blk_free_request(req); 4156e790746SPaolo Bonzini } else if (type & VIRTIO_BLK_T_OUT) { 416a83ceea8SMarc Marí qemu_iovec_init_external(&req->qiov, iov, out_num); 4176e790746SPaolo Bonzini virtio_blk_handle_write(req, mrb); 4186e790746SPaolo Bonzini } else if (type == VIRTIO_BLK_T_IN || type == VIRTIO_BLK_T_BARRIER) { 4196e790746SPaolo Bonzini /* VIRTIO_BLK_T_IN is 0, so we can't just & it. */ 420a83ceea8SMarc Marí qemu_iovec_init_external(&req->qiov, in_iov, in_num); 4216e790746SPaolo Bonzini virtio_blk_handle_read(req); 4226e790746SPaolo Bonzini } else { 4236e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_UNSUPP); 424671ec3f0SFam Zheng virtio_blk_free_request(req); 4256e790746SPaolo Bonzini } 4266e790746SPaolo Bonzini } 4276e790746SPaolo Bonzini 4286e790746SPaolo Bonzini static void virtio_blk_handle_output(VirtIODevice *vdev, VirtQueue *vq) 4296e790746SPaolo Bonzini { 4306e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 4316e790746SPaolo Bonzini VirtIOBlockReq *req; 4326e790746SPaolo Bonzini MultiReqBuffer mrb = { 4336e790746SPaolo Bonzini .num_writes = 0, 4346e790746SPaolo Bonzini }; 4356e790746SPaolo Bonzini 4366e790746SPaolo Bonzini /* Some guests kick before setting VIRTIO_CONFIG_S_DRIVER_OK so start 4376e790746SPaolo Bonzini * dataplane here instead of waiting for .set_status(). 4386e790746SPaolo Bonzini */ 4396e790746SPaolo Bonzini if (s->dataplane) { 4406e790746SPaolo Bonzini virtio_blk_data_plane_start(s->dataplane); 4416e790746SPaolo Bonzini return; 4426e790746SPaolo Bonzini } 4436e790746SPaolo Bonzini 4446e790746SPaolo Bonzini while ((req = virtio_blk_get_request(s))) { 4456e790746SPaolo Bonzini virtio_blk_handle_request(req, &mrb); 4466e790746SPaolo Bonzini } 4476e790746SPaolo Bonzini 4486e790746SPaolo Bonzini virtio_submit_multiwrite(s->bs, &mrb); 4496e790746SPaolo Bonzini 4506e790746SPaolo Bonzini /* 4516e790746SPaolo Bonzini * FIXME: Want to check for completions before returning to guest mode, 4526e790746SPaolo Bonzini * so cached reads and writes are reported as quickly as possible. But 4536e790746SPaolo Bonzini * that should be done in the generic block layer. 4546e790746SPaolo Bonzini */ 4556e790746SPaolo Bonzini } 4566e790746SPaolo Bonzini 4576e790746SPaolo Bonzini static void virtio_blk_dma_restart_bh(void *opaque) 4586e790746SPaolo Bonzini { 4596e790746SPaolo Bonzini VirtIOBlock *s = opaque; 4606e790746SPaolo Bonzini VirtIOBlockReq *req = s->rq; 4616e790746SPaolo Bonzini MultiReqBuffer mrb = { 4626e790746SPaolo Bonzini .num_writes = 0, 4636e790746SPaolo Bonzini }; 4646e790746SPaolo Bonzini 4656e790746SPaolo Bonzini qemu_bh_delete(s->bh); 4666e790746SPaolo Bonzini s->bh = NULL; 4676e790746SPaolo Bonzini 4686e790746SPaolo Bonzini s->rq = NULL; 4696e790746SPaolo Bonzini 4706e790746SPaolo Bonzini while (req) { 4711bdb176aSzhanghailiang VirtIOBlockReq *next = req->next; 4726e790746SPaolo Bonzini virtio_blk_handle_request(req, &mrb); 4731bdb176aSzhanghailiang req = next; 4746e790746SPaolo Bonzini } 4756e790746SPaolo Bonzini 4766e790746SPaolo Bonzini virtio_submit_multiwrite(s->bs, &mrb); 4776e790746SPaolo Bonzini } 4786e790746SPaolo Bonzini 4796e790746SPaolo Bonzini static void virtio_blk_dma_restart_cb(void *opaque, int running, 4806e790746SPaolo Bonzini RunState state) 4816e790746SPaolo Bonzini { 4826e790746SPaolo Bonzini VirtIOBlock *s = opaque; 4836e790746SPaolo Bonzini 4846e790746SPaolo Bonzini if (!running) { 4856e790746SPaolo Bonzini return; 4866e790746SPaolo Bonzini } 4876e790746SPaolo Bonzini 4886e790746SPaolo Bonzini if (!s->bh) { 4894407c1c5SFam Zheng s->bh = aio_bh_new(bdrv_get_aio_context(s->blk.conf.bs), 4904407c1c5SFam Zheng virtio_blk_dma_restart_bh, s); 4916e790746SPaolo Bonzini qemu_bh_schedule(s->bh); 4926e790746SPaolo Bonzini } 4936e790746SPaolo Bonzini } 4946e790746SPaolo Bonzini 4956e790746SPaolo Bonzini static void virtio_blk_reset(VirtIODevice *vdev) 4966e790746SPaolo Bonzini { 4976e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 4986e790746SPaolo Bonzini 4996e790746SPaolo Bonzini if (s->dataplane) { 5006e790746SPaolo Bonzini virtio_blk_data_plane_stop(s->dataplane); 5016e790746SPaolo Bonzini } 5026e790746SPaolo Bonzini 5036e790746SPaolo Bonzini /* 5046e790746SPaolo Bonzini * This should cancel pending requests, but can't do nicely until there 5056e790746SPaolo Bonzini * are per-device request lists. 5066e790746SPaolo Bonzini */ 5076e790746SPaolo Bonzini bdrv_drain_all(); 508ef5bc962SPaolo Bonzini bdrv_set_enable_write_cache(s->bs, s->original_wce); 5096e790746SPaolo Bonzini } 5106e790746SPaolo Bonzini 5116e790746SPaolo Bonzini /* coalesce internal state, copy to pci i/o region 0 5126e790746SPaolo Bonzini */ 5136e790746SPaolo Bonzini static void virtio_blk_update_config(VirtIODevice *vdev, uint8_t *config) 5146e790746SPaolo Bonzini { 5156e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5166e790746SPaolo Bonzini struct virtio_blk_config blkcfg; 5176e790746SPaolo Bonzini uint64_t capacity; 5186e790746SPaolo Bonzini int blk_size = s->conf->logical_block_size; 5196e790746SPaolo Bonzini 5206e790746SPaolo Bonzini bdrv_get_geometry(s->bs, &capacity); 5216e790746SPaolo Bonzini memset(&blkcfg, 0, sizeof(blkcfg)); 522783d1897SRusty Russell virtio_stq_p(vdev, &blkcfg.capacity, capacity); 523783d1897SRusty Russell virtio_stl_p(vdev, &blkcfg.seg_max, 128 - 2); 524783d1897SRusty Russell virtio_stw_p(vdev, &blkcfg.cylinders, s->conf->cyls); 525783d1897SRusty Russell virtio_stl_p(vdev, &blkcfg.blk_size, blk_size); 526783d1897SRusty Russell virtio_stw_p(vdev, &blkcfg.min_io_size, s->conf->min_io_size / blk_size); 527783d1897SRusty Russell virtio_stw_p(vdev, &blkcfg.opt_io_size, s->conf->opt_io_size / blk_size); 5286e790746SPaolo Bonzini blkcfg.heads = s->conf->heads; 5296e790746SPaolo Bonzini /* 5306e790746SPaolo Bonzini * We must ensure that the block device capacity is a multiple of 531e03ba136SPeter Maydell * the logical block size. If that is not the case, let's use 5326e790746SPaolo Bonzini * sector_mask to adopt the geometry to have a correct picture. 5336e790746SPaolo Bonzini * For those devices where the capacity is ok for the given geometry 534e03ba136SPeter Maydell * we don't touch the sector value of the geometry, since some devices 5356e790746SPaolo Bonzini * (like s390 dasd) need a specific value. Here the capacity is already 5366e790746SPaolo Bonzini * cyls*heads*secs*blk_size and the sector value is not block size 5376e790746SPaolo Bonzini * divided by 512 - instead it is the amount of blk_size blocks 5386e790746SPaolo Bonzini * per track (cylinder). 5396e790746SPaolo Bonzini */ 5406e790746SPaolo Bonzini if (bdrv_getlength(s->bs) / s->conf->heads / s->conf->secs % blk_size) { 5416e790746SPaolo Bonzini blkcfg.sectors = s->conf->secs & ~s->sector_mask; 5426e790746SPaolo Bonzini } else { 5436e790746SPaolo Bonzini blkcfg.sectors = s->conf->secs; 5446e790746SPaolo Bonzini } 5456e790746SPaolo Bonzini blkcfg.size_max = 0; 5466e790746SPaolo Bonzini blkcfg.physical_block_exp = get_physical_block_exp(s->conf); 5476e790746SPaolo Bonzini blkcfg.alignment_offset = 0; 5486e790746SPaolo Bonzini blkcfg.wce = bdrv_enable_write_cache(s->bs); 5496e790746SPaolo Bonzini memcpy(config, &blkcfg, sizeof(struct virtio_blk_config)); 5506e790746SPaolo Bonzini } 5516e790746SPaolo Bonzini 5526e790746SPaolo Bonzini static void virtio_blk_set_config(VirtIODevice *vdev, const uint8_t *config) 5536e790746SPaolo Bonzini { 5546e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5556e790746SPaolo Bonzini struct virtio_blk_config blkcfg; 5566e790746SPaolo Bonzini 5576e790746SPaolo Bonzini memcpy(&blkcfg, config, sizeof(blkcfg)); 5586d7e73d6SFam Zheng 5596d7e73d6SFam Zheng aio_context_acquire(bdrv_get_aio_context(s->bs)); 5606e790746SPaolo Bonzini bdrv_set_enable_write_cache(s->bs, blkcfg.wce != 0); 5616d7e73d6SFam Zheng aio_context_release(bdrv_get_aio_context(s->bs)); 5626e790746SPaolo Bonzini } 5636e790746SPaolo Bonzini 5646e790746SPaolo Bonzini static uint32_t virtio_blk_get_features(VirtIODevice *vdev, uint32_t features) 5656e790746SPaolo Bonzini { 5666e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5676e790746SPaolo Bonzini 5686e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_SEG_MAX); 5696e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_GEOMETRY); 5706e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_TOPOLOGY); 5716e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_BLK_SIZE); 5726e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_SCSI); 5736e790746SPaolo Bonzini 5746e790746SPaolo Bonzini if (s->blk.config_wce) { 5756e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_CONFIG_WCE); 5766e790746SPaolo Bonzini } 5776e790746SPaolo Bonzini if (bdrv_enable_write_cache(s->bs)) 5786e790746SPaolo Bonzini features |= (1 << VIRTIO_BLK_F_WCE); 5796e790746SPaolo Bonzini 5806e790746SPaolo Bonzini if (bdrv_is_read_only(s->bs)) 5816e790746SPaolo Bonzini features |= 1 << VIRTIO_BLK_F_RO; 5826e790746SPaolo Bonzini 5836e790746SPaolo Bonzini return features; 5846e790746SPaolo Bonzini } 5856e790746SPaolo Bonzini 5866e790746SPaolo Bonzini static void virtio_blk_set_status(VirtIODevice *vdev, uint8_t status) 5876e790746SPaolo Bonzini { 5886e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 5896e790746SPaolo Bonzini uint32_t features; 5906e790746SPaolo Bonzini 5916e790746SPaolo Bonzini if (s->dataplane && !(status & (VIRTIO_CONFIG_S_DRIVER | 5926e790746SPaolo Bonzini VIRTIO_CONFIG_S_DRIVER_OK))) { 5936e790746SPaolo Bonzini virtio_blk_data_plane_stop(s->dataplane); 5946e790746SPaolo Bonzini } 5956e790746SPaolo Bonzini 5966e790746SPaolo Bonzini if (!(status & VIRTIO_CONFIG_S_DRIVER_OK)) { 5976e790746SPaolo Bonzini return; 5986e790746SPaolo Bonzini } 5996e790746SPaolo Bonzini 6006e790746SPaolo Bonzini features = vdev->guest_features; 601ef5bc962SPaolo Bonzini 602ef5bc962SPaolo Bonzini /* A guest that supports VIRTIO_BLK_F_CONFIG_WCE must be able to send 603ef5bc962SPaolo Bonzini * cache flushes. Thus, the "auto writethrough" behavior is never 604ef5bc962SPaolo Bonzini * necessary for guests that support the VIRTIO_BLK_F_CONFIG_WCE feature. 605ef5bc962SPaolo Bonzini * Leaving it enabled would break the following sequence: 606ef5bc962SPaolo Bonzini * 607ef5bc962SPaolo Bonzini * Guest started with "-drive cache=writethrough" 608ef5bc962SPaolo Bonzini * Guest sets status to 0 609ef5bc962SPaolo Bonzini * Guest sets DRIVER bit in status field 610ef5bc962SPaolo Bonzini * Guest reads host features (WCE=0, CONFIG_WCE=1) 611ef5bc962SPaolo Bonzini * Guest writes guest features (WCE=0, CONFIG_WCE=1) 612ef5bc962SPaolo Bonzini * Guest writes 1 to the WCE configuration field (writeback mode) 613ef5bc962SPaolo Bonzini * Guest sets DRIVER_OK bit in status field 614ef5bc962SPaolo Bonzini * 615ef5bc962SPaolo Bonzini * s->bs would erroneously be placed in writethrough mode. 616ef5bc962SPaolo Bonzini */ 617ef5bc962SPaolo Bonzini if (!(features & (1 << VIRTIO_BLK_F_CONFIG_WCE))) { 6186d7e73d6SFam Zheng aio_context_acquire(bdrv_get_aio_context(s->bs)); 6196d7e73d6SFam Zheng bdrv_set_enable_write_cache(s->bs, 6206d7e73d6SFam Zheng !!(features & (1 << VIRTIO_BLK_F_WCE))); 6216d7e73d6SFam Zheng aio_context_release(bdrv_get_aio_context(s->bs)); 6226e790746SPaolo Bonzini } 623ef5bc962SPaolo Bonzini } 6246e790746SPaolo Bonzini 6256e790746SPaolo Bonzini static void virtio_blk_save(QEMUFile *f, void *opaque) 6266e790746SPaolo Bonzini { 627b2b295a7SGreg Kurz VirtIODevice *vdev = VIRTIO_DEVICE(opaque); 6286e790746SPaolo Bonzini 6296e790746SPaolo Bonzini virtio_save(vdev, f); 630b2b295a7SGreg Kurz } 631b2b295a7SGreg Kurz 632b2b295a7SGreg Kurz static void virtio_blk_save_device(VirtIODevice *vdev, QEMUFile *f) 633b2b295a7SGreg Kurz { 634b2b295a7SGreg Kurz VirtIOBlock *s = VIRTIO_BLK(vdev); 635b2b295a7SGreg Kurz VirtIOBlockReq *req = s->rq; 6366e790746SPaolo Bonzini 6376e790746SPaolo Bonzini while (req) { 6386e790746SPaolo Bonzini qemu_put_sbyte(f, 1); 639f897bf75SStefan Hajnoczi qemu_put_buffer(f, (unsigned char *)&req->elem, 640671ec3f0SFam Zheng sizeof(VirtQueueElement)); 6416e790746SPaolo Bonzini req = req->next; 6426e790746SPaolo Bonzini } 6436e790746SPaolo Bonzini qemu_put_sbyte(f, 0); 6446e790746SPaolo Bonzini } 6456e790746SPaolo Bonzini 6466e790746SPaolo Bonzini static int virtio_blk_load(QEMUFile *f, void *opaque, int version_id) 6476e790746SPaolo Bonzini { 6486e790746SPaolo Bonzini VirtIOBlock *s = opaque; 6496e790746SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(s); 6506e790746SPaolo Bonzini 6516e790746SPaolo Bonzini if (version_id != 2) 6526e790746SPaolo Bonzini return -EINVAL; 6536e790746SPaolo Bonzini 654b2b295a7SGreg Kurz return virtio_load(vdev, f, version_id); 6556e790746SPaolo Bonzini } 6566e790746SPaolo Bonzini 657b2b295a7SGreg Kurz static int virtio_blk_load_device(VirtIODevice *vdev, QEMUFile *f, 658b2b295a7SGreg Kurz int version_id) 659b2b295a7SGreg Kurz { 660b2b295a7SGreg Kurz VirtIOBlock *s = VIRTIO_BLK(vdev); 661b2b295a7SGreg Kurz 6626e790746SPaolo Bonzini while (qemu_get_sbyte(f)) { 6636e790746SPaolo Bonzini VirtIOBlockReq *req = virtio_blk_alloc_request(s); 664f897bf75SStefan Hajnoczi qemu_get_buffer(f, (unsigned char *)&req->elem, 665671ec3f0SFam Zheng sizeof(VirtQueueElement)); 6666e790746SPaolo Bonzini req->next = s->rq; 6676e790746SPaolo Bonzini s->rq = req; 6686e790746SPaolo Bonzini 669f897bf75SStefan Hajnoczi virtqueue_map_sg(req->elem.in_sg, req->elem.in_addr, 670f897bf75SStefan Hajnoczi req->elem.in_num, 1); 671f897bf75SStefan Hajnoczi virtqueue_map_sg(req->elem.out_sg, req->elem.out_addr, 672f897bf75SStefan Hajnoczi req->elem.out_num, 0); 6736e790746SPaolo Bonzini } 6746e790746SPaolo Bonzini 6756e790746SPaolo Bonzini return 0; 6766e790746SPaolo Bonzini } 6776e790746SPaolo Bonzini 6786e790746SPaolo Bonzini static void virtio_blk_resize(void *opaque) 6796e790746SPaolo Bonzini { 6806e790746SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(opaque); 6816e790746SPaolo Bonzini 6826e790746SPaolo Bonzini virtio_notify_config(vdev); 6836e790746SPaolo Bonzini } 6846e790746SPaolo Bonzini 6856e790746SPaolo Bonzini static const BlockDevOps virtio_block_ops = { 6866e790746SPaolo Bonzini .resize_cb = virtio_blk_resize, 6876e790746SPaolo Bonzini }; 6886e790746SPaolo Bonzini 68984db52d0SStefan Hajnoczi /* Disable dataplane thread during live migration since it does not 69084db52d0SStefan Hajnoczi * update the dirty memory bitmap yet. 69184db52d0SStefan Hajnoczi */ 69284db52d0SStefan Hajnoczi static void virtio_blk_migration_state_changed(Notifier *notifier, void *data) 69384db52d0SStefan Hajnoczi { 69484db52d0SStefan Hajnoczi VirtIOBlock *s = container_of(notifier, VirtIOBlock, 69584db52d0SStefan Hajnoczi migration_state_notifier); 69684db52d0SStefan Hajnoczi MigrationState *mig = data; 6973ffeeef7SAndreas Färber Error *err = NULL; 69884db52d0SStefan Hajnoczi 69984db52d0SStefan Hajnoczi if (migration_in_setup(mig)) { 70084db52d0SStefan Hajnoczi if (!s->dataplane) { 70184db52d0SStefan Hajnoczi return; 70284db52d0SStefan Hajnoczi } 70384db52d0SStefan Hajnoczi virtio_blk_data_plane_destroy(s->dataplane); 70484db52d0SStefan Hajnoczi s->dataplane = NULL; 70584db52d0SStefan Hajnoczi } else if (migration_has_finished(mig) || 70684db52d0SStefan Hajnoczi migration_has_failed(mig)) { 70784db52d0SStefan Hajnoczi if (s->dataplane) { 70884db52d0SStefan Hajnoczi return; 70984db52d0SStefan Hajnoczi } 71084db52d0SStefan Hajnoczi bdrv_drain_all(); /* complete in-flight non-dataplane requests */ 71184db52d0SStefan Hajnoczi virtio_blk_data_plane_create(VIRTIO_DEVICE(s), &s->blk, 7123ffeeef7SAndreas Färber &s->dataplane, &err); 7133ffeeef7SAndreas Färber if (err != NULL) { 7143ffeeef7SAndreas Färber error_report("%s", error_get_pretty(err)); 7153ffeeef7SAndreas Färber error_free(err); 7163ffeeef7SAndreas Färber } 71784db52d0SStefan Hajnoczi } 71884db52d0SStefan Hajnoczi } 71984db52d0SStefan Hajnoczi 72075884afdSAndreas Färber static void virtio_blk_device_realize(DeviceState *dev, Error **errp) 7216e790746SPaolo Bonzini { 72275884afdSAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 723179b417eSAndreas Färber VirtIOBlock *s = VIRTIO_BLK(dev); 7246e790746SPaolo Bonzini VirtIOBlkConf *blk = &(s->blk); 7253ffeeef7SAndreas Färber Error *err = NULL; 7266e790746SPaolo Bonzini static int virtio_blk_id; 7276e790746SPaolo Bonzini 7286e790746SPaolo Bonzini if (!blk->conf.bs) { 72975884afdSAndreas Färber error_setg(errp, "drive property not set"); 73075884afdSAndreas Färber return; 7316e790746SPaolo Bonzini } 7326e790746SPaolo Bonzini if (!bdrv_is_inserted(blk->conf.bs)) { 73375884afdSAndreas Färber error_setg(errp, "Device needs media, but drive is empty"); 73475884afdSAndreas Färber return; 7356e790746SPaolo Bonzini } 7366e790746SPaolo Bonzini 7376e790746SPaolo Bonzini blkconf_serial(&blk->conf, &blk->serial); 738ef5bc962SPaolo Bonzini s->original_wce = bdrv_enable_write_cache(blk->conf.bs); 7395ff5efb4SFam Zheng blkconf_geometry(&blk->conf, NULL, 65535, 255, 255, &err); 7405ff5efb4SFam Zheng if (err) { 7415ff5efb4SFam Zheng error_propagate(errp, err); 74275884afdSAndreas Färber return; 7436e790746SPaolo Bonzini } 7446e790746SPaolo Bonzini 7456e790746SPaolo Bonzini virtio_init(vdev, "virtio-blk", VIRTIO_ID_BLOCK, 7466e790746SPaolo Bonzini sizeof(struct virtio_blk_config)); 7476e790746SPaolo Bonzini 7486e790746SPaolo Bonzini s->bs = blk->conf.bs; 7496e790746SPaolo Bonzini s->conf = &blk->conf; 7506e790746SPaolo Bonzini s->rq = NULL; 7516e790746SPaolo Bonzini s->sector_mask = (s->conf->logical_block_size / BDRV_SECTOR_SIZE) - 1; 7526e790746SPaolo Bonzini 7536e790746SPaolo Bonzini s->vq = virtio_add_queue(vdev, 128, virtio_blk_handle_output); 754bf4bd461SFam Zheng s->complete_request = virtio_blk_complete_request; 7553ffeeef7SAndreas Färber virtio_blk_data_plane_create(vdev, blk, &s->dataplane, &err); 7563ffeeef7SAndreas Färber if (err != NULL) { 75775884afdSAndreas Färber error_propagate(errp, err); 7586a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 75975884afdSAndreas Färber return; 7606e790746SPaolo Bonzini } 76184db52d0SStefan Hajnoczi s->migration_state_notifier.notify = virtio_blk_migration_state_changed; 76284db52d0SStefan Hajnoczi add_migration_state_change_notifier(&s->migration_state_notifier); 7636e790746SPaolo Bonzini 7646e790746SPaolo Bonzini s->change = qemu_add_vm_change_state_handler(virtio_blk_dma_restart_cb, s); 765179b417eSAndreas Färber register_savevm(dev, "virtio-blk", virtio_blk_id++, 2, 7666e790746SPaolo Bonzini virtio_blk_save, virtio_blk_load, s); 7676e790746SPaolo Bonzini bdrv_set_dev_ops(s->bs, &virtio_block_ops, s); 7681b7fd729SPaolo Bonzini bdrv_set_guest_block_size(s->bs, s->conf->logical_block_size); 7696e790746SPaolo Bonzini 7706e790746SPaolo Bonzini bdrv_iostatus_enable(s->bs); 7716e790746SPaolo Bonzini 772179b417eSAndreas Färber add_boot_device_path(s->conf->bootindex, dev, "/disk@0,0"); 7736e790746SPaolo Bonzini } 7746e790746SPaolo Bonzini 775306ec6c3SAndreas Färber static void virtio_blk_device_unrealize(DeviceState *dev, Error **errp) 7766e790746SPaolo Bonzini { 777306ec6c3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 778306ec6c3SAndreas Färber VirtIOBlock *s = VIRTIO_BLK(dev); 779306ec6c3SAndreas Färber 78084db52d0SStefan Hajnoczi remove_migration_state_change_notifier(&s->migration_state_notifier); 7816e790746SPaolo Bonzini virtio_blk_data_plane_destroy(s->dataplane); 7826e790746SPaolo Bonzini s->dataplane = NULL; 7836e790746SPaolo Bonzini qemu_del_vm_change_state_handler(s->change); 784306ec6c3SAndreas Färber unregister_savevm(dev, "virtio-blk", s); 7856e790746SPaolo Bonzini blockdev_mark_auto_del(s->bs); 7866a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 7876e790746SPaolo Bonzini } 7886e790746SPaolo Bonzini 789467b3f33SStefan Hajnoczi static void virtio_blk_instance_init(Object *obj) 790467b3f33SStefan Hajnoczi { 791467b3f33SStefan Hajnoczi VirtIOBlock *s = VIRTIO_BLK(obj); 792467b3f33SStefan Hajnoczi 793467b3f33SStefan Hajnoczi object_property_add_link(obj, "iothread", TYPE_IOTHREAD, 794467b3f33SStefan Hajnoczi (Object **)&s->blk.iothread, 795467b3f33SStefan Hajnoczi qdev_prop_allow_set_link_before_realize, 796467b3f33SStefan Hajnoczi OBJ_PROP_LINK_UNREF_ON_RELEASE, NULL); 797*3342ec32SGonglei device_add_bootindex_property(obj, &s->blk.conf.bootindex, 798*3342ec32SGonglei "bootindex", "/disk@0,0", 799*3342ec32SGonglei DEVICE(obj), NULL); 800467b3f33SStefan Hajnoczi } 801467b3f33SStefan Hajnoczi 8026e790746SPaolo Bonzini static Property virtio_blk_properties[] = { 80332a877e4SStefan Hajnoczi DEFINE_BLOCK_PROPERTIES(VirtIOBlock, blk.conf), 80432a877e4SStefan Hajnoczi DEFINE_BLOCK_CHS_PROPERTIES(VirtIOBlock, blk.conf), 80532a877e4SStefan Hajnoczi DEFINE_PROP_STRING("serial", VirtIOBlock, blk.serial), 80632a877e4SStefan Hajnoczi DEFINE_PROP_BIT("config-wce", VirtIOBlock, blk.config_wce, 0, true), 80732a877e4SStefan Hajnoczi #ifdef __linux__ 80832a877e4SStefan Hajnoczi DEFINE_PROP_BIT("scsi", VirtIOBlock, blk.scsi, 0, true), 80932a877e4SStefan Hajnoczi #endif 81032a877e4SStefan Hajnoczi DEFINE_PROP_BIT("x-data-plane", VirtIOBlock, blk.data_plane, 0, false), 8116e790746SPaolo Bonzini DEFINE_PROP_END_OF_LIST(), 8126e790746SPaolo Bonzini }; 8136e790746SPaolo Bonzini 8146e790746SPaolo Bonzini static void virtio_blk_class_init(ObjectClass *klass, void *data) 8156e790746SPaolo Bonzini { 8166e790746SPaolo Bonzini DeviceClass *dc = DEVICE_CLASS(klass); 8176e790746SPaolo Bonzini VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass); 81875884afdSAndreas Färber 8196e790746SPaolo Bonzini dc->props = virtio_blk_properties; 820125ee0edSMarcel Apfelbaum set_bit(DEVICE_CATEGORY_STORAGE, dc->categories); 82175884afdSAndreas Färber vdc->realize = virtio_blk_device_realize; 822306ec6c3SAndreas Färber vdc->unrealize = virtio_blk_device_unrealize; 8236e790746SPaolo Bonzini vdc->get_config = virtio_blk_update_config; 8246e790746SPaolo Bonzini vdc->set_config = virtio_blk_set_config; 8256e790746SPaolo Bonzini vdc->get_features = virtio_blk_get_features; 8266e790746SPaolo Bonzini vdc->set_status = virtio_blk_set_status; 8276e790746SPaolo Bonzini vdc->reset = virtio_blk_reset; 828b2b295a7SGreg Kurz vdc->save = virtio_blk_save_device; 829b2b295a7SGreg Kurz vdc->load = virtio_blk_load_device; 8306e790746SPaolo Bonzini } 8316e790746SPaolo Bonzini 8326e790746SPaolo Bonzini static const TypeInfo virtio_device_info = { 8336e790746SPaolo Bonzini .name = TYPE_VIRTIO_BLK, 8346e790746SPaolo Bonzini .parent = TYPE_VIRTIO_DEVICE, 8356e790746SPaolo Bonzini .instance_size = sizeof(VirtIOBlock), 836467b3f33SStefan Hajnoczi .instance_init = virtio_blk_instance_init, 8376e790746SPaolo Bonzini .class_init = virtio_blk_class_init, 8386e790746SPaolo Bonzini }; 8396e790746SPaolo Bonzini 8406e790746SPaolo Bonzini static void virtio_register_types(void) 8416e790746SPaolo Bonzini { 8426e790746SPaolo Bonzini type_register_static(&virtio_device_info); 8436e790746SPaolo Bonzini } 8446e790746SPaolo Bonzini 8456e790746SPaolo Bonzini type_init(virtio_register_types) 846