16e790746SPaolo Bonzini /* 26e790746SPaolo Bonzini * Virtio Block Device 36e790746SPaolo Bonzini * 46e790746SPaolo Bonzini * Copyright IBM, Corp. 2007 56e790746SPaolo Bonzini * 66e790746SPaolo Bonzini * Authors: 76e790746SPaolo Bonzini * Anthony Liguori <aliguori@us.ibm.com> 86e790746SPaolo Bonzini * 96e790746SPaolo Bonzini * This work is licensed under the terms of the GNU GPL, version 2. See 106e790746SPaolo Bonzini * the COPYING file in the top-level directory. 116e790746SPaolo Bonzini * 126e790746SPaolo Bonzini */ 136e790746SPaolo Bonzini 1480c71a24SPeter Maydell #include "qemu/osdep.h" 15433fcea4SStefan Hajnoczi #include "qemu/defer-call.h" 16da34e65cSMarkus Armbruster #include "qapi/error.h" 17827805a2SFam Zheng #include "qemu/iov.h" 180b8fa32fSMarkus Armbruster #include "qemu/module.h" 196e790746SPaolo Bonzini #include "qemu/error-report.h" 209b92fbcfSSergio Lopez #include "qemu/main-loop.h" 214f736650SSam Li #include "block/block_int.h" 226e790746SPaolo Bonzini #include "trace.h" 236e790746SPaolo Bonzini #include "hw/block/block.h" 24a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h" 256e790746SPaolo Bonzini #include "sysemu/blockdev.h" 26baf42268SStefan Hajnoczi #include "sysemu/block-ram-registrar.h" 272f780b6aSMarkus Armbruster #include "sysemu/sysemu.h" 2854d31236SMarkus Armbruster #include "sysemu/runstate.h" 296e790746SPaolo Bonzini #include "hw/virtio/virtio-blk.h" 306e790746SPaolo Bonzini #include "dataplane/virtio-blk.h" 3108e2c9f1SPaolo Bonzini #include "scsi/constants.h" 326e790746SPaolo Bonzini #ifdef __linux__ 336e790746SPaolo Bonzini # include <scsi/sg.h> 346e790746SPaolo Bonzini #endif 356e790746SPaolo Bonzini #include "hw/virtio/virtio-bus.h" 36ca77ee28SMarkus Armbruster #include "migration/qemu-file-types.h" 37783d1897SRusty Russell #include "hw/virtio/virtio-access.h" 38d9cf55a8SDaniil Tatianin #include "hw/virtio/virtio-blk-common.h" 394c41c69eSHiroki Narukawa #include "qemu/coroutine.h" 406e790746SPaolo Bonzini 41d14dde5eSGreg 
Kurz static void virtio_blk_init_request(VirtIOBlock *s, VirtQueue *vq, 42edaffd9fSStefan Hajnoczi VirtIOBlockReq *req) 43671ec3f0SFam Zheng { 44671ec3f0SFam Zheng req->dev = s; 45edaffd9fSStefan Hajnoczi req->vq = vq; 46869d66afSStefan Hajnoczi req->qiov.size = 0; 472a6cdd6dSPaolo Bonzini req->in_len = 0; 48869d66afSStefan Hajnoczi req->next = NULL; 4995f7142aSPeter Lieven req->mr_next = NULL; 50671ec3f0SFam Zheng } 51671ec3f0SFam Zheng 52d14dde5eSGreg Kurz static void virtio_blk_free_request(VirtIOBlockReq *req) 53671ec3f0SFam Zheng { 54c84b3192SPaolo Bonzini g_free(req); 55671ec3f0SFam Zheng } 56671ec3f0SFam Zheng 5703de2f52SPaolo Bonzini static void virtio_blk_req_complete(VirtIOBlockReq *req, unsigned char status) 586e790746SPaolo Bonzini { 596e790746SPaolo Bonzini VirtIOBlock *s = req->dev; 606e790746SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(s); 616e790746SPaolo Bonzini 62a576ceacSStefan Hajnoczi trace_virtio_blk_req_complete(vdev, req, status); 636e790746SPaolo Bonzini 646e790746SPaolo Bonzini stb_p(&req->in->status, status); 657bd04a04SStefan Hajnoczi iov_discard_undo(&req->inhdr_undo); 667bd04a04SStefan Hajnoczi iov_discard_undo(&req->outhdr_undo); 67edaffd9fSStefan Hajnoczi virtqueue_push(req->vq, &req->elem, req->in_len); 68eb41cf78SPaolo Bonzini if (s->dataplane_started && !s->dataplane_disabled) { 69edaffd9fSStefan Hajnoczi virtio_blk_data_plane_notify(s->dataplane, req->vq); 7003de2f52SPaolo Bonzini } else { 71edaffd9fSStefan Hajnoczi virtio_notify(vdev, req->vq); 726e790746SPaolo Bonzini } 73bf4bd461SFam Zheng } 74bf4bd461SFam Zheng 756e790746SPaolo Bonzini static int virtio_blk_handle_rw_error(VirtIOBlockReq *req, int error, 7600f639fbSStefano Garzarella bool is_read, bool acct_failed) 776e790746SPaolo Bonzini { 786e790746SPaolo Bonzini VirtIOBlock *s = req->dev; 799a6719d5SStefano Garzarella BlockErrorAction action = blk_get_error_action(s->blk, is_read, error); 806e790746SPaolo Bonzini 81a589569fSWenchao Xia if (action == 
BLOCK_ERROR_ACTION_STOP) { 82466138dcSFam Zheng /* Break the link as the next request is going to be parsed from the 83466138dcSFam Zheng * ring again. Otherwise we may end up doing a double completion! */ 84466138dcSFam Zheng req->mr_next = NULL; 859c67f33fSStefan Hajnoczi 869c67f33fSStefan Hajnoczi WITH_QEMU_LOCK_GUARD(&s->rq_lock) { 876e790746SPaolo Bonzini req->next = s->rq; 886e790746SPaolo Bonzini s->rq = req; 899c67f33fSStefan Hajnoczi } 90a589569fSWenchao Xia } else if (action == BLOCK_ERROR_ACTION_REPORT) { 916e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR); 9200f639fbSStefano Garzarella if (acct_failed) { 9301762e03SAlberto Garcia block_acct_failed(blk_get_stats(s->blk), &req->acct); 9400f639fbSStefano Garzarella } 95671ec3f0SFam Zheng virtio_blk_free_request(req); 966e790746SPaolo Bonzini } 976e790746SPaolo Bonzini 984be74634SMarkus Armbruster blk_error_action(s->blk, action, is_read, error); 99a589569fSWenchao Xia return action != BLOCK_ERROR_ACTION_IGNORE; 1006e790746SPaolo Bonzini } 1016e790746SPaolo Bonzini 1026e790746SPaolo Bonzini static void virtio_blk_rw_complete(void *opaque, int ret) 1036e790746SPaolo Bonzini { 10495f7142aSPeter Lieven VirtIOBlockReq *next = opaque; 105b9e413ddSPaolo Bonzini VirtIOBlock *s = next->dev; 106a576ceacSStefan Hajnoczi VirtIODevice *vdev = VIRTIO_DEVICE(s); 1076e790746SPaolo Bonzini 10895f7142aSPeter Lieven while (next) { 10995f7142aSPeter Lieven VirtIOBlockReq *req = next; 11095f7142aSPeter Lieven next = req->mr_next; 111a576ceacSStefan Hajnoczi trace_virtio_blk_rw_complete(vdev, req, ret); 1126e790746SPaolo Bonzini 11395f7142aSPeter Lieven if (req->qiov.nalloc != -1) { 114e61809edSDongli Zhang /* If nalloc is != -1 req->qiov is a local copy of the original 1159bb192a4SYaowei Bai * external iovec. It was allocated in submit_requests to be 1169bb192a4SYaowei Bai * able to merge requests. 
*/ 11795f7142aSPeter Lieven qemu_iovec_destroy(&req->qiov); 11895f7142aSPeter Lieven } 11995f7142aSPeter Lieven 1206e790746SPaolo Bonzini if (ret) { 121bf4069fbSAnastasiia Rusakova int p = virtio_ldl_p(VIRTIO_DEVICE(s), &req->out.type); 122783d1897SRusty Russell bool is_read = !(p & VIRTIO_BLK_T_OUT); 1232a6cdd6dSPaolo Bonzini /* Note that memory may be dirtied on read failure. If the 1242a6cdd6dSPaolo Bonzini * virtio request is not completed here, as is the case for 1252a6cdd6dSPaolo Bonzini * BLOCK_ERROR_ACTION_STOP, the memory may not be copied 1262a6cdd6dSPaolo Bonzini * correctly during live migration. While this is ugly, 1272a6cdd6dSPaolo Bonzini * it is acceptable because the device is free to write to 1282a6cdd6dSPaolo Bonzini * the memory until the request is completed (which will 1292a6cdd6dSPaolo Bonzini * happen on the other side of the migration). 1302a6cdd6dSPaolo Bonzini */ 13100f639fbSStefano Garzarella if (virtio_blk_handle_rw_error(req, -ret, is_read, true)) { 13295f7142aSPeter Lieven continue; 13395f7142aSPeter Lieven } 1346e790746SPaolo Bonzini } 1356e790746SPaolo Bonzini 1366e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 137bf4069fbSAnastasiia Rusakova block_acct_done(blk_get_stats(s->blk), &req->acct); 138671ec3f0SFam Zheng virtio_blk_free_request(req); 1396e790746SPaolo Bonzini } 14095f7142aSPeter Lieven } 1416e790746SPaolo Bonzini 1426e790746SPaolo Bonzini static void virtio_blk_flush_complete(void *opaque, int ret) 1436e790746SPaolo Bonzini { 1446e790746SPaolo Bonzini VirtIOBlockReq *req = opaque; 145b9e413ddSPaolo Bonzini VirtIOBlock *s = req->dev; 1466e790746SPaolo Bonzini 147c1135913SStefan Hajnoczi if (ret && virtio_blk_handle_rw_error(req, -ret, 0, true)) { 148c1135913SStefan Hajnoczi return; 1496e790746SPaolo Bonzini } 1506e790746SPaolo Bonzini 1516e790746SPaolo Bonzini virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 1529a6719d5SStefano Garzarella block_acct_done(blk_get_stats(s->blk), &req->acct); 
153671ec3f0SFam Zheng virtio_blk_free_request(req); 1546e790746SPaolo Bonzini } 1556e790746SPaolo Bonzini 15637b06f8dSStefano Garzarella static void virtio_blk_discard_write_zeroes_complete(void *opaque, int ret) 15737b06f8dSStefano Garzarella { 15837b06f8dSStefano Garzarella VirtIOBlockReq *req = opaque; 15937b06f8dSStefano Garzarella VirtIOBlock *s = req->dev; 16037b06f8dSStefano Garzarella bool is_write_zeroes = (virtio_ldl_p(VIRTIO_DEVICE(s), &req->out.type) & 16137b06f8dSStefano Garzarella ~VIRTIO_BLK_T_BARRIER) == VIRTIO_BLK_T_WRITE_ZEROES; 16237b06f8dSStefano Garzarella 163c1135913SStefan Hajnoczi if (ret && virtio_blk_handle_rw_error(req, -ret, false, is_write_zeroes)) { 164c1135913SStefan Hajnoczi return; 16537b06f8dSStefano Garzarella } 16637b06f8dSStefano Garzarella 16737b06f8dSStefano Garzarella virtio_blk_req_complete(req, VIRTIO_BLK_S_OK); 16837b06f8dSStefano Garzarella if (is_write_zeroes) { 16937b06f8dSStefano Garzarella block_acct_done(blk_get_stats(s->blk), &req->acct); 17037b06f8dSStefano Garzarella } 17137b06f8dSStefano Garzarella virtio_blk_free_request(req); 17237b06f8dSStefano Garzarella } 17337b06f8dSStefano Garzarella 1741dc936aaSFam Zheng #ifdef __linux__ 1751dc936aaSFam Zheng 1761dc936aaSFam Zheng typedef struct { 1771dc936aaSFam Zheng VirtIOBlockReq *req; 1781dc936aaSFam Zheng struct sg_io_hdr hdr; 1791dc936aaSFam Zheng } VirtIOBlockIoctlReq; 1801dc936aaSFam Zheng 1811dc936aaSFam Zheng static void virtio_blk_ioctl_complete(void *opaque, int status) 1821dc936aaSFam Zheng { 1831dc936aaSFam Zheng VirtIOBlockIoctlReq *ioctl_req = opaque; 1841dc936aaSFam Zheng VirtIOBlockReq *req = ioctl_req->req; 1859d456654SPaolo Bonzini VirtIOBlock *s = req->dev; 1869d456654SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(s); 1871dc936aaSFam Zheng struct virtio_scsi_inhdr *scsi; 1881dc936aaSFam Zheng struct sg_io_hdr *hdr; 1891dc936aaSFam Zheng 1901dc936aaSFam Zheng scsi = (void *)req->elem.in_sg[req->elem.in_num - 2].iov_base; 1911dc936aaSFam Zheng 
1921dc936aaSFam Zheng if (status) { 1931dc936aaSFam Zheng status = VIRTIO_BLK_S_UNSUPP; 1941dc936aaSFam Zheng virtio_stl_p(vdev, &scsi->errors, 255); 1951dc936aaSFam Zheng goto out; 1961dc936aaSFam Zheng } 1971dc936aaSFam Zheng 1981dc936aaSFam Zheng hdr = &ioctl_req->hdr; 1991dc936aaSFam Zheng /* 2001dc936aaSFam Zheng * From SCSI-Generic-HOWTO: "Some lower level drivers (e.g. ide-scsi) 2011dc936aaSFam Zheng * clear the masked_status field [hence status gets cleared too, see 2021dc936aaSFam Zheng * block/scsi_ioctl.c] even when a CHECK_CONDITION or COMMAND_TERMINATED 2031dc936aaSFam Zheng * status has occurred. However they do set DRIVER_SENSE in driver_status 2041dc936aaSFam Zheng * field. Also a (sb_len_wr > 0) indicates there is a sense buffer. 2051dc936aaSFam Zheng */ 2061dc936aaSFam Zheng if (hdr->status == 0 && hdr->sb_len_wr > 0) { 2071dc936aaSFam Zheng hdr->status = CHECK_CONDITION; 2081dc936aaSFam Zheng } 2091dc936aaSFam Zheng 2101dc936aaSFam Zheng virtio_stl_p(vdev, &scsi->errors, 2111dc936aaSFam Zheng hdr->status | (hdr->msg_status << 8) | 2121dc936aaSFam Zheng (hdr->host_status << 16) | (hdr->driver_status << 24)); 2131dc936aaSFam Zheng virtio_stl_p(vdev, &scsi->residual, hdr->resid); 2141dc936aaSFam Zheng virtio_stl_p(vdev, &scsi->sense_len, hdr->sb_len_wr); 2151dc936aaSFam Zheng virtio_stl_p(vdev, &scsi->data_len, hdr->dxfer_len); 2161dc936aaSFam Zheng 2171dc936aaSFam Zheng out: 2181dc936aaSFam Zheng virtio_blk_req_complete(req, status); 2191dc936aaSFam Zheng virtio_blk_free_request(req); 2201dc936aaSFam Zheng g_free(ioctl_req); 2211dc936aaSFam Zheng } 2221dc936aaSFam Zheng 2231dc936aaSFam Zheng #endif 2241dc936aaSFam Zheng 225edaffd9fSStefan Hajnoczi static VirtIOBlockReq *virtio_blk_get_request(VirtIOBlock *s, VirtQueue *vq) 2266e790746SPaolo Bonzini { 227edaffd9fSStefan Hajnoczi VirtIOBlockReq *req = virtqueue_pop(vq, sizeof(VirtIOBlockReq)); 2286e790746SPaolo Bonzini 22951b19ebeSPaolo Bonzini if (req) { 230edaffd9fSStefan Hajnoczi 
virtio_blk_init_request(s, vq, req); 2316e790746SPaolo Bonzini } 2326e790746SPaolo Bonzini return req; 2336e790746SPaolo Bonzini } 2346e790746SPaolo Bonzini 23575344fa4SFam Zheng static int virtio_blk_handle_scsi_req(VirtIOBlockReq *req) 2366e790746SPaolo Bonzini { 2376e790746SPaolo Bonzini int status = VIRTIO_BLK_S_OK; 2385a05cbeeSFam Zheng struct virtio_scsi_inhdr *scsi = NULL; 23975344fa4SFam Zheng VirtIOBlock *blk = req->dev; 240bf4069fbSAnastasiia Rusakova VirtIODevice *vdev = VIRTIO_DEVICE(blk); 241bf4069fbSAnastasiia Rusakova VirtQueueElement *elem = &req->elem; 242783d1897SRusty Russell 2435a05cbeeSFam Zheng #ifdef __linux__ 2445a05cbeeSFam Zheng int i; 2451dc936aaSFam Zheng VirtIOBlockIoctlReq *ioctl_req; 246a209f461SFam Zheng BlockAIOCB *acb; 2475a05cbeeSFam Zheng #endif 2486e790746SPaolo Bonzini 2496e790746SPaolo Bonzini /* 2506e790746SPaolo Bonzini * We require at least one output segment each for the virtio_blk_outhdr 2516e790746SPaolo Bonzini * and the SCSI command block. 2526e790746SPaolo Bonzini * 2536e790746SPaolo Bonzini * We also at least require the virtio_blk_inhdr, the virtio_scsi_inhdr 2546e790746SPaolo Bonzini * and the sense buffer pointer in the input segments. 2556e790746SPaolo Bonzini */ 2565a05cbeeSFam Zheng if (elem->out_num < 2 || elem->in_num < 3) { 2575a05cbeeSFam Zheng status = VIRTIO_BLK_S_IOERR; 2585a05cbeeSFam Zheng goto fail; 2596e790746SPaolo Bonzini } 2606e790746SPaolo Bonzini 2616e790746SPaolo Bonzini /* 2626e790746SPaolo Bonzini * The scsi inhdr is placed in the second-to-last input segment, just 2636e790746SPaolo Bonzini * before the regular inhdr. 
2646e790746SPaolo Bonzini */ 2655a05cbeeSFam Zheng scsi = (void *)elem->in_sg[elem->in_num - 2].iov_base; 2666e790746SPaolo Bonzini 267bbe8bd4dSStefano Garzarella if (!virtio_has_feature(blk->host_features, VIRTIO_BLK_F_SCSI)) { 2686e790746SPaolo Bonzini status = VIRTIO_BLK_S_UNSUPP; 2696e790746SPaolo Bonzini goto fail; 2706e790746SPaolo Bonzini } 2716e790746SPaolo Bonzini 2726e790746SPaolo Bonzini /* 2736e790746SPaolo Bonzini * No support for bidirection commands yet. 2746e790746SPaolo Bonzini */ 2755a05cbeeSFam Zheng if (elem->out_num > 2 && elem->in_num > 3) { 2766e790746SPaolo Bonzini status = VIRTIO_BLK_S_UNSUPP; 2776e790746SPaolo Bonzini goto fail; 2786e790746SPaolo Bonzini } 2796e790746SPaolo Bonzini 2806e790746SPaolo Bonzini #ifdef __linux__ 2811dc936aaSFam Zheng ioctl_req = g_new0(VirtIOBlockIoctlReq, 1); 2821dc936aaSFam Zheng ioctl_req->req = req; 2831dc936aaSFam Zheng ioctl_req->hdr.interface_id = 'S'; 2841dc936aaSFam Zheng ioctl_req->hdr.cmd_len = elem->out_sg[1].iov_len; 2851dc936aaSFam Zheng ioctl_req->hdr.cmdp = elem->out_sg[1].iov_base; 2861dc936aaSFam Zheng ioctl_req->hdr.dxfer_len = 0; 2876e790746SPaolo Bonzini 2885a05cbeeSFam Zheng if (elem->out_num > 2) { 2896e790746SPaolo Bonzini /* 2906e790746SPaolo Bonzini * If there are more than the minimally required 2 output segments 2916e790746SPaolo Bonzini * there is write payload starting from the third iovec. 
2926e790746SPaolo Bonzini */ 2931dc936aaSFam Zheng ioctl_req->hdr.dxfer_direction = SG_DXFER_TO_DEV; 2941dc936aaSFam Zheng ioctl_req->hdr.iovec_count = elem->out_num - 2; 2956e790746SPaolo Bonzini 2961dc936aaSFam Zheng for (i = 0; i < ioctl_req->hdr.iovec_count; i++) { 2971dc936aaSFam Zheng ioctl_req->hdr.dxfer_len += elem->out_sg[i + 2].iov_len; 2981dc936aaSFam Zheng } 2996e790746SPaolo Bonzini 3001dc936aaSFam Zheng ioctl_req->hdr.dxferp = elem->out_sg + 2; 3016e790746SPaolo Bonzini 3025a05cbeeSFam Zheng } else if (elem->in_num > 3) { 3036e790746SPaolo Bonzini /* 3046e790746SPaolo Bonzini * If we have more than 3 input segments the guest wants to actually 3056e790746SPaolo Bonzini * read data. 3066e790746SPaolo Bonzini */ 3071dc936aaSFam Zheng ioctl_req->hdr.dxfer_direction = SG_DXFER_FROM_DEV; 3081dc936aaSFam Zheng ioctl_req->hdr.iovec_count = elem->in_num - 3; 3091dc936aaSFam Zheng for (i = 0; i < ioctl_req->hdr.iovec_count; i++) { 3101dc936aaSFam Zheng ioctl_req->hdr.dxfer_len += elem->in_sg[i].iov_len; 3111dc936aaSFam Zheng } 3126e790746SPaolo Bonzini 3131dc936aaSFam Zheng ioctl_req->hdr.dxferp = elem->in_sg; 3146e790746SPaolo Bonzini } else { 3156e790746SPaolo Bonzini /* 3166e790746SPaolo Bonzini * Some SCSI commands don't actually transfer any data. 
3176e790746SPaolo Bonzini */ 3181dc936aaSFam Zheng ioctl_req->hdr.dxfer_direction = SG_DXFER_NONE; 3196e790746SPaolo Bonzini } 3206e790746SPaolo Bonzini 3211dc936aaSFam Zheng ioctl_req->hdr.sbp = elem->in_sg[elem->in_num - 3].iov_base; 3221dc936aaSFam Zheng ioctl_req->hdr.mx_sb_len = elem->in_sg[elem->in_num - 3].iov_len; 3236e790746SPaolo Bonzini 324a209f461SFam Zheng acb = blk_aio_ioctl(blk->blk, SG_IO, &ioctl_req->hdr, 3251dc936aaSFam Zheng virtio_blk_ioctl_complete, ioctl_req); 326a209f461SFam Zheng if (!acb) { 327a209f461SFam Zheng g_free(ioctl_req); 328a209f461SFam Zheng status = VIRTIO_BLK_S_UNSUPP; 329a209f461SFam Zheng goto fail; 330a209f461SFam Zheng } 3311dc936aaSFam Zheng return -EINPROGRESS; 3326e790746SPaolo Bonzini #else 3336e790746SPaolo Bonzini abort(); 3346e790746SPaolo Bonzini #endif 3356e790746SPaolo Bonzini 3366e790746SPaolo Bonzini fail: 3376e790746SPaolo Bonzini /* Just put anything nonzero so that the ioctl fails in the guest. */ 3385a05cbeeSFam Zheng if (scsi) { 339783d1897SRusty Russell virtio_stl_p(vdev, &scsi->errors, 255); 3405a05cbeeSFam Zheng } 3415a05cbeeSFam Zheng return status; 3425a05cbeeSFam Zheng } 3435a05cbeeSFam Zheng 3445a05cbeeSFam Zheng static void virtio_blk_handle_scsi(VirtIOBlockReq *req) 3455a05cbeeSFam Zheng { 3465a05cbeeSFam Zheng int status; 3475a05cbeeSFam Zheng 34875344fa4SFam Zheng status = virtio_blk_handle_scsi_req(req); 3491dc936aaSFam Zheng if (status != -EINPROGRESS) { 3506e790746SPaolo Bonzini virtio_blk_req_complete(req, status); 351671ec3f0SFam Zheng virtio_blk_free_request(req); 3526e790746SPaolo Bonzini } 3531dc936aaSFam Zheng } 3546e790746SPaolo Bonzini 355baf42268SStefan Hajnoczi static inline void submit_requests(VirtIOBlock *s, MultiReqBuffer *mrb, 35695f7142aSPeter Lieven int start, int num_reqs, int niov) 3576e790746SPaolo Bonzini { 358baf42268SStefan Hajnoczi BlockBackend *blk = s->blk; 35995f7142aSPeter Lieven QEMUIOVector *qiov = &mrb->reqs[start]->qiov; 36095f7142aSPeter Lieven int64_t 
sector_num = mrb->reqs[start]->sector_num; 36195f7142aSPeter Lieven bool is_write = mrb->is_write; 362baf42268SStefan Hajnoczi BdrvRequestFlags flags = 0; 3636e790746SPaolo Bonzini 36495f7142aSPeter Lieven if (num_reqs > 1) { 36595f7142aSPeter Lieven int i; 36695f7142aSPeter Lieven struct iovec *tmp_iov = qiov->iov; 36795f7142aSPeter Lieven int tmp_niov = qiov->niov; 36895f7142aSPeter Lieven 36995f7142aSPeter Lieven /* mrb->reqs[start]->qiov was initialized from external so we can't 370b5772fddSEric Blake * modify it here. We need to initialize it locally and then add the 37195f7142aSPeter Lieven * external iovecs. */ 37295f7142aSPeter Lieven qemu_iovec_init(qiov, niov); 37395f7142aSPeter Lieven 37495f7142aSPeter Lieven for (i = 0; i < tmp_niov; i++) { 37595f7142aSPeter Lieven qemu_iovec_add(qiov, tmp_iov[i].iov_base, tmp_iov[i].iov_len); 37695f7142aSPeter Lieven } 37795f7142aSPeter Lieven 37895f7142aSPeter Lieven for (i = start + 1; i < start + num_reqs; i++) { 37995f7142aSPeter Lieven qemu_iovec_concat(qiov, &mrb->reqs[i]->qiov, 0, 38095f7142aSPeter Lieven mrb->reqs[i]->qiov.size); 38195f7142aSPeter Lieven mrb->reqs[i - 1]->mr_next = mrb->reqs[i]; 38295f7142aSPeter Lieven } 38395f7142aSPeter Lieven 384a576ceacSStefan Hajnoczi trace_virtio_blk_submit_multireq(VIRTIO_DEVICE(mrb->reqs[start]->dev), 385a576ceacSStefan Hajnoczi mrb, start, num_reqs, 386b5772fddSEric Blake sector_num << BDRV_SECTOR_BITS, 387b5772fddSEric Blake qiov->size, is_write); 38895f7142aSPeter Lieven block_acct_merge_done(blk_get_stats(blk), 38995f7142aSPeter Lieven is_write ? 
BLOCK_ACCT_WRITE : BLOCK_ACCT_READ, 39095f7142aSPeter Lieven num_reqs - 1); 39195f7142aSPeter Lieven } 39295f7142aSPeter Lieven 393baf42268SStefan Hajnoczi if (blk_ram_registrar_ok(&s->blk_ram_registrar)) { 394baf42268SStefan Hajnoczi flags |= BDRV_REQ_REGISTERED_BUF; 395baf42268SStefan Hajnoczi } 396baf42268SStefan Hajnoczi 39795f7142aSPeter Lieven if (is_write) { 398baf42268SStefan Hajnoczi blk_aio_pwritev(blk, sector_num << BDRV_SECTOR_BITS, qiov, 399baf42268SStefan Hajnoczi flags, virtio_blk_rw_complete, 400baf42268SStefan Hajnoczi mrb->reqs[start]); 40195f7142aSPeter Lieven } else { 402baf42268SStefan Hajnoczi blk_aio_preadv(blk, sector_num << BDRV_SECTOR_BITS, qiov, 403baf42268SStefan Hajnoczi flags, virtio_blk_rw_complete, 404baf42268SStefan Hajnoczi mrb->reqs[start]); 40595f7142aSPeter Lieven } 40695f7142aSPeter Lieven } 40795f7142aSPeter Lieven 40895f7142aSPeter Lieven static int multireq_compare(const void *a, const void *b) 40995f7142aSPeter Lieven { 41095f7142aSPeter Lieven const VirtIOBlockReq *req1 = *(VirtIOBlockReq **)a, 41195f7142aSPeter Lieven *req2 = *(VirtIOBlockReq **)b; 41295f7142aSPeter Lieven 41395f7142aSPeter Lieven /* 41495f7142aSPeter Lieven * Note that we can't simply subtract sector_num1 from sector_num2 41595f7142aSPeter Lieven * here as that could overflow the return value. 
41695f7142aSPeter Lieven */ 41795f7142aSPeter Lieven if (req1->sector_num > req2->sector_num) { 41895f7142aSPeter Lieven return 1; 41995f7142aSPeter Lieven } else if (req1->sector_num < req2->sector_num) { 42095f7142aSPeter Lieven return -1; 42195f7142aSPeter Lieven } else { 42295f7142aSPeter Lieven return 0; 42395f7142aSPeter Lieven } 42495f7142aSPeter Lieven } 42595f7142aSPeter Lieven 426baf42268SStefan Hajnoczi static void virtio_blk_submit_multireq(VirtIOBlock *s, MultiReqBuffer *mrb) 42795f7142aSPeter Lieven { 42895f7142aSPeter Lieven int i = 0, start = 0, num_reqs = 0, niov = 0, nb_sectors = 0; 4295def6b80SEric Blake uint32_t max_transfer; 43095f7142aSPeter Lieven int64_t sector_num = 0; 43195f7142aSPeter Lieven 43295f7142aSPeter Lieven if (mrb->num_reqs == 1) { 433baf42268SStefan Hajnoczi submit_requests(s, mrb, 0, 1, -1); 43495f7142aSPeter Lieven mrb->num_reqs = 0; 4356e790746SPaolo Bonzini return; 4366e790746SPaolo Bonzini } 4376e790746SPaolo Bonzini 4385def6b80SEric Blake max_transfer = blk_get_max_transfer(mrb->reqs[0]->dev->blk); 43995f7142aSPeter Lieven 44095f7142aSPeter Lieven qsort(mrb->reqs, mrb->num_reqs, sizeof(*mrb->reqs), 44195f7142aSPeter Lieven &multireq_compare); 44295f7142aSPeter Lieven 44395f7142aSPeter Lieven for (i = 0; i < mrb->num_reqs; i++) { 44495f7142aSPeter Lieven VirtIOBlockReq *req = mrb->reqs[i]; 44595f7142aSPeter Lieven if (num_reqs > 0) { 44649cffbc6SGonglei /* 44749cffbc6SGonglei * NOTE: We cannot merge the requests in below situations: 44849cffbc6SGonglei * 1. requests are not sequential 44949cffbc6SGonglei * 2. merge would exceed maximum number of IOVs 45049cffbc6SGonglei * 3. 
merge would exceed maximum transfer length of backend device 45149cffbc6SGonglei */ 45249cffbc6SGonglei if (sector_num + nb_sectors != req->sector_num || 453baf42268SStefan Hajnoczi niov > blk_get_max_iov(s->blk) - req->qiov.niov || 4545def6b80SEric Blake req->qiov.size > max_transfer || 4555def6b80SEric Blake nb_sectors > (max_transfer - 4565def6b80SEric Blake req->qiov.size) / BDRV_SECTOR_SIZE) { 457baf42268SStefan Hajnoczi submit_requests(s, mrb, start, num_reqs, niov); 45895f7142aSPeter Lieven num_reqs = 0; 4596e790746SPaolo Bonzini } 4606e790746SPaolo Bonzini } 4616e790746SPaolo Bonzini 46295f7142aSPeter Lieven if (num_reqs == 0) { 46395f7142aSPeter Lieven sector_num = req->sector_num; 46495f7142aSPeter Lieven nb_sectors = niov = 0; 46595f7142aSPeter Lieven start = i; 46695f7142aSPeter Lieven } 46795f7142aSPeter Lieven 46895f7142aSPeter Lieven nb_sectors += req->qiov.size / BDRV_SECTOR_SIZE; 46995f7142aSPeter Lieven niov += req->qiov.niov; 47095f7142aSPeter Lieven num_reqs++; 47195f7142aSPeter Lieven } 47295f7142aSPeter Lieven 473baf42268SStefan Hajnoczi submit_requests(s, mrb, start, num_reqs, niov); 47495f7142aSPeter Lieven mrb->num_reqs = 0; 4756e790746SPaolo Bonzini } 4766e790746SPaolo Bonzini 4776e790746SPaolo Bonzini static void virtio_blk_handle_flush(VirtIOBlockReq *req, MultiReqBuffer *mrb) 4786e790746SPaolo Bonzini { 479bf4069fbSAnastasiia Rusakova VirtIOBlock *s = req->dev; 480bf4069fbSAnastasiia Rusakova 481bf4069fbSAnastasiia Rusakova block_acct_start(blk_get_stats(s->blk), &req->acct, 0, 4825366d0c8SBenoît Canet BLOCK_ACCT_FLUSH); 4836e790746SPaolo Bonzini 4846e790746SPaolo Bonzini /* 4856e790746SPaolo Bonzini * Make sure all outstanding writes are posted to the backing device. 
4866e790746SPaolo Bonzini */ 48795f7142aSPeter Lieven if (mrb->is_write && mrb->num_reqs > 0) { 488baf42268SStefan Hajnoczi virtio_blk_submit_multireq(s, mrb); 48995f7142aSPeter Lieven } 490bf4069fbSAnastasiia Rusakova blk_aio_flush(s->blk, virtio_blk_flush_complete, req); 4916e790746SPaolo Bonzini } 4926e790746SPaolo Bonzini 493d0e14376SMarkus Armbruster static bool virtio_blk_sect_range_ok(VirtIOBlock *dev, 494d0e14376SMarkus Armbruster uint64_t sector, size_t size) 495d0e14376SMarkus Armbruster { 4963c2daac0SMarkus Armbruster uint64_t nb_sectors = size >> BDRV_SECTOR_BITS; 4973c2daac0SMarkus Armbruster uint64_t total_sectors; 4983c2daac0SMarkus Armbruster 49975af1f34SPeter Lieven if (nb_sectors > BDRV_REQUEST_MAX_SECTORS) { 50095f7142aSPeter Lieven return false; 50195f7142aSPeter Lieven } 502d0e14376SMarkus Armbruster if (sector & dev->sector_mask) { 503d0e14376SMarkus Armbruster return false; 504d0e14376SMarkus Armbruster } 5052a30307fSMarkus Armbruster if (size % dev->conf.conf.logical_block_size) { 506d0e14376SMarkus Armbruster return false; 507d0e14376SMarkus Armbruster } 5084be74634SMarkus Armbruster blk_get_geometry(dev->blk, &total_sectors); 5093c2daac0SMarkus Armbruster if (sector > total_sectors || nb_sectors > total_sectors - sector) { 5103c2daac0SMarkus Armbruster return false; 5113c2daac0SMarkus Armbruster } 512d0e14376SMarkus Armbruster return true; 513d0e14376SMarkus Armbruster } 514d0e14376SMarkus Armbruster 51537b06f8dSStefano Garzarella static uint8_t virtio_blk_handle_discard_write_zeroes(VirtIOBlockReq *req, 51637b06f8dSStefano Garzarella struct virtio_blk_discard_write_zeroes *dwz_hdr, bool is_write_zeroes) 51737b06f8dSStefano Garzarella { 51837b06f8dSStefano Garzarella VirtIOBlock *s = req->dev; 51937b06f8dSStefano Garzarella VirtIODevice *vdev = VIRTIO_DEVICE(s); 52037b06f8dSStefano Garzarella uint64_t sector; 52137b06f8dSStefano Garzarella uint32_t num_sectors, flags, max_sectors; 52237b06f8dSStefano Garzarella uint8_t err_status; 
52337b06f8dSStefano Garzarella int bytes; 52437b06f8dSStefano Garzarella 52537b06f8dSStefano Garzarella sector = virtio_ldq_p(vdev, &dwz_hdr->sector); 52637b06f8dSStefano Garzarella num_sectors = virtio_ldl_p(vdev, &dwz_hdr->num_sectors); 52737b06f8dSStefano Garzarella flags = virtio_ldl_p(vdev, &dwz_hdr->flags); 52837b06f8dSStefano Garzarella max_sectors = is_write_zeroes ? s->conf.max_write_zeroes_sectors : 52937b06f8dSStefano Garzarella s->conf.max_discard_sectors; 53037b06f8dSStefano Garzarella 53137b06f8dSStefano Garzarella /* 53237b06f8dSStefano Garzarella * max_sectors is at most BDRV_REQUEST_MAX_SECTORS, this check 53337b06f8dSStefano Garzarella * make us sure that "num_sectors << BDRV_SECTOR_BITS" can fit in 53437b06f8dSStefano Garzarella * the integer variable. 53537b06f8dSStefano Garzarella */ 53637b06f8dSStefano Garzarella if (unlikely(num_sectors > max_sectors)) { 53737b06f8dSStefano Garzarella err_status = VIRTIO_BLK_S_IOERR; 53837b06f8dSStefano Garzarella goto err; 53937b06f8dSStefano Garzarella } 54037b06f8dSStefano Garzarella 54137b06f8dSStefano Garzarella bytes = num_sectors << BDRV_SECTOR_BITS; 54237b06f8dSStefano Garzarella 54337b06f8dSStefano Garzarella if (unlikely(!virtio_blk_sect_range_ok(s, sector, bytes))) { 54437b06f8dSStefano Garzarella err_status = VIRTIO_BLK_S_IOERR; 54537b06f8dSStefano Garzarella goto err; 54637b06f8dSStefano Garzarella } 54737b06f8dSStefano Garzarella 54837b06f8dSStefano Garzarella /* 54937b06f8dSStefano Garzarella * The device MUST set the status byte to VIRTIO_BLK_S_UNSUPP for discard 55037b06f8dSStefano Garzarella * and write zeroes commands if any unknown flag is set. 
55137b06f8dSStefano Garzarella */ 55237b06f8dSStefano Garzarella if (unlikely(flags & ~VIRTIO_BLK_WRITE_ZEROES_FLAG_UNMAP)) { 55337b06f8dSStefano Garzarella err_status = VIRTIO_BLK_S_UNSUPP; 55437b06f8dSStefano Garzarella goto err; 55537b06f8dSStefano Garzarella } 55637b06f8dSStefano Garzarella 55737b06f8dSStefano Garzarella if (is_write_zeroes) { /* VIRTIO_BLK_T_WRITE_ZEROES */ 55837b06f8dSStefano Garzarella int blk_aio_flags = 0; 55937b06f8dSStefano Garzarella 56037b06f8dSStefano Garzarella if (flags & VIRTIO_BLK_WRITE_ZEROES_FLAG_UNMAP) { 56137b06f8dSStefano Garzarella blk_aio_flags |= BDRV_REQ_MAY_UNMAP; 56237b06f8dSStefano Garzarella } 56337b06f8dSStefano Garzarella 56437b06f8dSStefano Garzarella block_acct_start(blk_get_stats(s->blk), &req->acct, bytes, 56537b06f8dSStefano Garzarella BLOCK_ACCT_WRITE); 56637b06f8dSStefano Garzarella 56737b06f8dSStefano Garzarella blk_aio_pwrite_zeroes(s->blk, sector << BDRV_SECTOR_BITS, 56837b06f8dSStefano Garzarella bytes, blk_aio_flags, 56937b06f8dSStefano Garzarella virtio_blk_discard_write_zeroes_complete, req); 57037b06f8dSStefano Garzarella } else { /* VIRTIO_BLK_T_DISCARD */ 57137b06f8dSStefano Garzarella /* 57237b06f8dSStefano Garzarella * The device MUST set the status byte to VIRTIO_BLK_S_UNSUPP for 57337b06f8dSStefano Garzarella * discard commands if the unmap flag is set. 
57437b06f8dSStefano Garzarella */ 57537b06f8dSStefano Garzarella if (unlikely(flags & VIRTIO_BLK_WRITE_ZEROES_FLAG_UNMAP)) { 57637b06f8dSStefano Garzarella err_status = VIRTIO_BLK_S_UNSUPP; 57737b06f8dSStefano Garzarella goto err; 57837b06f8dSStefano Garzarella } 57937b06f8dSStefano Garzarella 58037b06f8dSStefano Garzarella blk_aio_pdiscard(s->blk, sector << BDRV_SECTOR_BITS, bytes, 58137b06f8dSStefano Garzarella virtio_blk_discard_write_zeroes_complete, req); 58237b06f8dSStefano Garzarella } 58337b06f8dSStefano Garzarella 58437b06f8dSStefano Garzarella return VIRTIO_BLK_S_OK; 58537b06f8dSStefano Garzarella 58637b06f8dSStefano Garzarella err: 58737b06f8dSStefano Garzarella if (is_write_zeroes) { 58837b06f8dSStefano Garzarella block_acct_invalid(blk_get_stats(s->blk), BLOCK_ACCT_WRITE); 58937b06f8dSStefano Garzarella } 59037b06f8dSStefano Garzarella return err_status; 59137b06f8dSStefano Garzarella } 59237b06f8dSStefano Garzarella

/*
 * Context carried from a zone report / zone append handler to its
 * asynchronous completion callback.
 *
 * req:     the request to complete and free once the operation finishes
 * in_iov:  device-writable scatter list the result is copied into
 * in_num:  number of entries in in_iov
 *
 * zone_report_data is used by the zone report path: nr_zones is handed to
 * blk_aio_zone_report() by pointer and read back by the completion as the
 * number of descriptors to emit; zones is the descriptor array it fills.
 *
 * zone_append_data is used by the zone append path: offset is handed to
 * blk_aio_zone_append() by pointer and read back by the completion, which
 * reports it to the driver as a sector number.
 */
typedef struct ZoneCmdData {
    VirtIOBlockReq *req;
    struct iovec *in_iov;
    unsigned in_num;
    union {
        struct {
            unsigned int nr_zones;
            BlockZoneDescriptor *zones;
        } zone_report_data;
        struct {
            int64_t offset;
        } zone_append_data;
    };
} ZoneCmdData;

/*
 * check_zoned_request: error checking before issuing zoned requests.
 *
 * @s:      the virtio-blk device
 * @offset: start of the request, in bytes
 * @len:    length of the request, in bytes
 * @append: true if the request is a zone append; enables the extra
 *          write-granularity, zone-type and max-append-size checks
 * @status: set to the VIRTIO_BLK_S_* code to report when a check fails;
 *          left untouched when all checks pass
 *
 * Returns true if all checks passed, false otherwise.
 */
static bool check_zoned_request(VirtIOBlock *s, int64_t offset, int64_t len,
                                bool append, uint8_t *status)
{
    BlockDriverState *bs = blk_bs(s->blk);
    int64_t index;

    if (!virtio_has_feature(s->host_features, VIRTIO_BLK_F_ZONED)) {
        *status = VIRTIO_BLK_S_UNSUPP;
        return false;
    }

    /* The subtraction form keeps the range check free of overflow. */
    if (offset < 0 || len < 0 || len > (bs->total_sectors << BDRV_SECTOR_BITS)
        || offset > (bs->total_sectors << BDRV_SECTOR_BITS) - len) {
        *status = VIRTIO_BLK_S_ZONE_INVALID_CMD;
        return false;
    }

    if (append) {
        if (bs->bl.write_granularity) {
            if ((offset % bs->bl.write_granularity) != 0) {
                *status = VIRTIO_BLK_S_ZONE_UNALIGNED_WP;
                return false;
            }
        }

        /* Zone append is rejected on conventional zones. */
        index = offset / bs->bl.zone_size;
        if (BDRV_ZT_IS_CONV(bs->wps->wp[index])) {
            *status = VIRTIO_BLK_S_ZONE_INVALID_CMD;
            return false;
        }

        /* len is known to be non-negative here, so the shift is exact. */
        if ((len >> BDRV_SECTOR_BITS) > bs->bl.max_append_sectors) {
            if (bs->bl.max_append_sectors == 0) {
                *status = VIRTIO_BLK_S_UNSUPP;
            } else {
                *status = VIRTIO_BLK_S_ZONE_INVALID_CMD;
            }
            return false;
        }
    }
    return true;
}

/*
 * Completion callback for blk_aio_zone_report().
 *
 * @opaque: the ZoneCmdData allocated by virtio_blk_handle_zone_report()
 * @ret:    result of the block-layer operation; non-zero means failure
 *
 * On success, writes a virtio_blk_zone_report header followed by one
 * virtio_blk_zone_descriptor per reported zone into the driver's input
 * buffer. In every case the request is completed and freed, and the
 * ZoneCmdData together with its descriptor array is released.
 */
static void virtio_blk_zone_report_complete(void *opaque, int ret)
{
    ZoneCmdData *data = opaque;
    VirtIOBlockReq *req = data->req;
    VirtIODevice *vdev = VIRTIO_DEVICE(req->dev);
    struct iovec *in_iov = data->in_iov;
    unsigned in_num = data->in_num;
    int64_t zrp_size, n, j = 0;
    int64_t nz = data->zone_report_data.nr_zones;
    uint8_t err_status = VIRTIO_BLK_S_OK;

    trace_virtio_blk_zone_report_complete(vdev, req, nz, ret);
    if (ret) {
        err_status = VIRTIO_BLK_S_ZONE_INVALID_CMD;
        goto out;
    }

    struct virtio_blk_zone_report zrp_hdr = (struct virtio_blk_zone_report) {
        .nr_zones = cpu_to_le64(nz),
    };
    zrp_size = sizeof(struct virtio_blk_zone_report)
               + sizeof(struct virtio_blk_zone_descriptor) * nz;
    n = iov_from_buf(in_iov, in_num, 0, &zrp_hdr, sizeof(zrp_hdr));
    if (n != sizeof(zrp_hdr)) {
        virtio_error(vdev, "Driver provided input buffer that is too small!");
        err_status = VIRTIO_BLK_S_ZONE_INVALID_CMD;
        goto out;
    }

    /* i is the byte offset of descriptor j inside the driver's buffer. */
    for (size_t i = sizeof(zrp_hdr); i < zrp_size;
         i += sizeof(struct virtio_blk_zone_descriptor), ++j) {
        struct virtio_blk_zone_descriptor desc =
            (struct virtio_blk_zone_descriptor) {
                .z_start = cpu_to_le64(data->zone_report_data.zones[j].start
                    >> BDRV_SECTOR_BITS),
                .z_cap = cpu_to_le64(data->zone_report_data.zones[j].cap
                    >> BDRV_SECTOR_BITS),
                .z_wp = cpu_to_le64(data->zone_report_data.zones[j].wp
                    >> BDRV_SECTOR_BITS),
        };

        switch (data->zone_report_data.zones[j].type) {
        case BLK_ZT_CONV:
            desc.z_type = VIRTIO_BLK_ZT_CONV;
            break;
        case BLK_ZT_SWR:
            desc.z_type = VIRTIO_BLK_ZT_SWR;
            break;
        case BLK_ZT_SWP:
            desc.z_type = VIRTIO_BLK_ZT_SWP;
            break;
        default:
            g_assert_not_reached();
        }

        switch (data->zone_report_data.zones[j].state) {
        case BLK_ZS_RDONLY:
            desc.z_state = VIRTIO_BLK_ZS_RDONLY;
            break;
        case BLK_ZS_OFFLINE:
            desc.z_state = VIRTIO_BLK_ZS_OFFLINE;
            break;
        case BLK_ZS_EMPTY:
            desc.z_state = VIRTIO_BLK_ZS_EMPTY;
            break;
        case BLK_ZS_CLOSED:
            desc.z_state = VIRTIO_BLK_ZS_CLOSED;
            break;
        case BLK_ZS_FULL:
            desc.z_state = VIRTIO_BLK_ZS_FULL;
            break;
        case BLK_ZS_EOPEN:
            desc.z_state = VIRTIO_BLK_ZS_EOPEN;
            break;
        case BLK_ZS_IOPEN:
            desc.z_state = VIRTIO_BLK_ZS_IOPEN;
            break;
        case BLK_ZS_NOT_WP:
            desc.z_state = VIRTIO_BLK_ZS_NOT_WP;
            break;
        default:
            g_assert_not_reached();
        }

        /* TODO: it takes O(n^2) time complexity. Optimizations required. */
        n = iov_from_buf(in_iov, in_num, i, &desc, sizeof(desc));
        if (n != sizeof(desc)) {
            virtio_error(vdev, "Driver provided input buffer "
                               "for descriptors that is too small!");
            err_status = VIRTIO_BLK_S_ZONE_INVALID_CMD;
            /*
             * Stop at the first short write, as the header path above does;
             * carrying on would only repeat the same error for every
             * remaining descriptor.
             */
            goto out;
        }
    }

out:
    virtio_blk_req_complete(req, err_status);
    virtio_blk_free_request(req);
    g_free(data->zone_report_data.zones);
    g_free(data);
}

/*
 * Handle VIRTIO_BLK_T_ZONE_REPORT.
 *
 * @req:    the request; its header fields and in_len have already been
 *          filled in by virtio_blk_handle_request()
 * @in_iov: device-writable scatter list for the report
 * @in_num: number of entries in in_iov
 *
 * The number of zones requested is derived from how many descriptors fit in
 * the driver's input buffer. On validation failure the request is completed
 * with an error status and freed here; otherwise ownership passes to
 * virtio_blk_zone_report_complete().
 */
static void virtio_blk_handle_zone_report(VirtIOBlockReq *req,
                                          struct iovec *in_iov,
                                          unsigned in_num)
{
    VirtIOBlock *s = req->dev;
    VirtIODevice *vdev = VIRTIO_DEVICE(s);
    unsigned int nr_zones;
    ZoneCmdData *data;
    int64_t offset;
    uint8_t err_status = VIRTIO_BLK_S_OK;

    if (req->in_len < sizeof(struct virtio_blk_inhdr) +
            sizeof(struct virtio_blk_zone_report) +
            sizeof(struct virtio_blk_zone_descriptor)) {
        virtio_error(vdev, "in buffer too small for zone report");
        /*
         * The caller does not see a failure from this handler, so the
         * request has to be completed and freed here or it would be leaked.
         */
        err_status = VIRTIO_BLK_S_ZONE_INVALID_CMD;
        goto out;
    }

    /* start byte offset of the zone report */
    offset = virtio_ldq_p(vdev, &req->out.sector) << BDRV_SECTOR_BITS;
    if (!check_zoned_request(s, offset, 0, false, &err_status)) {
        goto out;
    }
    nr_zones = (req->in_len - sizeof(struct virtio_blk_inhdr) -
                sizeof(struct virtio_blk_zone_report)) /
               sizeof(struct virtio_blk_zone_descriptor);
    trace_virtio_blk_handle_zone_report(vdev, req,
                                        offset >> BDRV_SECTOR_BITS, nr_zones);

    data = g_new(ZoneCmdData, 1);
    data->req = req;
    data->in_iov = in_iov;
    data->in_num = in_num;
    data->zone_report_data.nr_zones = nr_zones;
    data->zone_report_data.zones = g_new(BlockZoneDescriptor, nr_zones);

    blk_aio_zone_report(s->blk, offset, &data->zone_report_data.nr_zones,
                        data->zone_report_data.zones,
                        virtio_blk_zone_report_complete, data);
    return;
out:
    virtio_blk_req_complete(req, err_status);
    virtio_blk_free_request(req);
}

/*
 * Completion callback for blk_aio_zone_mgmt().
 *
 * @opaque: the VirtIOBlockReq being completed
 * @ret:    result of the block-layer operation; non-zero means failure
 *
 * Completes the request with VIRTIO_BLK_S_OK, or with
 * VIRTIO_BLK_S_ZONE_INVALID_CMD if the operation failed, then frees it.
 */
static void virtio_blk_zone_mgmt_complete(void *opaque, int ret)
{
    VirtIOBlockReq *req = opaque;
    VirtIOBlock *s = req->dev;
    VirtIODevice *vdev = VIRTIO_DEVICE(s);
    uint8_t err_status = VIRTIO_BLK_S_OK;
    trace_virtio_blk_zone_mgmt_complete(vdev, req, ret);

    if (ret) {
        err_status = VIRTIO_BLK_S_ZONE_INVALID_CMD;
    }

    virtio_blk_req_complete(req, err_status);
    virtio_blk_free_request(req);
}

/*
 * Handle the zone management requests (open, close, finish, reset and
 * reset-all).
 *
 * @req: the request; the target sector and request type are read from its
 *       out header
 * @op:  block-layer zone operation to perform
 *
 * For VIRTIO_BLK_T_ZONE_RESET_ALL the operation covers the whole device;
 * otherwise it covers one zone starting at the requested sector.
 *
 * Returns 0 if the operation was submitted. If validation fails, the request
 * is completed and freed here and the virtio status that was reported is
 * returned.
 */
static int virtio_blk_handle_zone_mgmt(VirtIOBlockReq *req, BlockZoneOp op)
{
    VirtIOBlock *s = req->dev;
    VirtIODevice *vdev = VIRTIO_DEVICE(s);
    BlockDriverState *bs = blk_bs(s->blk);
    int64_t offset = virtio_ldq_p(vdev, &req->out.sector) << BDRV_SECTOR_BITS;
    uint64_t len;
    uint64_t capacity = bs->total_sectors << BDRV_SECTOR_BITS;
    uint8_t err_status = VIRTIO_BLK_S_OK;

    uint32_t type = virtio_ldl_p(vdev, &req->out.type);
    if (type == VIRTIO_BLK_T_ZONE_RESET_ALL) {
        /* Entire drive capacity */
        offset = 0;
        len = capacity;
        trace_virtio_blk_handle_zone_reset_all(vdev, req, 0,
                                               bs->total_sectors);
    } else {
        if (bs->bl.zone_size > capacity - offset) {
            /*
             * The zoned device allows the last smaller zone.
             * Widen before multiplying so the product is evaluated in
             * 64 bits and cannot wrap in a narrower type.
             */
            len = capacity -
                  (uint64_t)bs->bl.zone_size * (bs->bl.nr_zones - 1);
        } else {
            len = bs->bl.zone_size;
        }
        trace_virtio_blk_handle_zone_mgmt(vdev, req, op,
                                          offset >> BDRV_SECTOR_BITS,
                                          len >> BDRV_SECTOR_BITS);
    }

    /* An out-of-range offset from the driver is rejected here. */
    if (!check_zoned_request(s, offset, len, false, &err_status)) {
        goto out;
    }

    blk_aio_zone_mgmt(s->blk, op, offset, len,
                      virtio_blk_zone_mgmt_complete, req);

    return 0;
out:
    virtio_blk_req_complete(req, err_status);
    virtio_blk_free_request(req);
    return err_status;
}

/*
 * Completion callback for blk_aio_zone_append().
 *
 * @opaque: the ZoneCmdData allocated by virtio_blk_handle_zone_append()
 * @ret:    result of the block-layer operation; non-zero means failure
 *
 * On success, the offset stored in the ZoneCmdData is converted to a sector
 * number and copied to the start of the driver's input buffer. The request
 * is then completed and freed, and the ZoneCmdData released.
 */
static void virtio_blk_zone_append_complete(void *opaque, int ret)
{
    ZoneCmdData *data = opaque;
    VirtIOBlockReq *req = data->req;
    VirtIODevice *vdev = VIRTIO_DEVICE(req->dev);
    int64_t append_sector, n;
    uint8_t err_status = VIRTIO_BLK_S_OK;

    if (ret) {
        err_status = VIRTIO_BLK_S_ZONE_INVALID_CMD;
        goto out;
    }

    virtio_stq_p(vdev, &append_sector,
                 data->zone_append_data.offset >> BDRV_SECTOR_BITS);
    n = iov_from_buf(data->in_iov, data->in_num, 0, &append_sector,
                     sizeof(append_sector));
    if (n != sizeof(append_sector)) {
        virtio_error(vdev, "Driver provided input buffer less than size of "
                           "append_sector");
        err_status = VIRTIO_BLK_S_ZONE_INVALID_CMD;
        goto out;
    }
    trace_virtio_blk_zone_append_complete(vdev, req, append_sector, ret);

out:
    virtio_blk_req_complete(req, err_status);
    virtio_blk_free_request(req);
    g_free(data);
}

/*
 * Handle VIRTIO_BLK_T_ZONE_APPEND.
 *
 * @req:     the request; the target sector is read from its out header
 * @out_iov: driver-readable scatter list holding the data to append
 * @in_iov:  device-writable scatter list that receives the resulting sector
 * @out_num: number of entries in out_iov
 * @in_num:  number of entries in in_iov
 *
 * Returns 0 if the append was submitted. If validation fails, the request is
 * completed and freed here and the virtio status that was reported is
 * returned.
 */
static int virtio_blk_handle_zone_append(VirtIOBlockReq *req,
                                         struct iovec *out_iov,
                                         struct iovec *in_iov,
                                         uint64_t out_num,
                                         unsigned in_num)
{
    VirtIOBlock *s = req->dev;
    VirtIODevice *vdev = VIRTIO_DEVICE(s);
    uint8_t err_status = VIRTIO_BLK_S_OK;
    ZoneCmdData *data;

    int64_t offset = virtio_ldq_p(vdev, &req->out.sector) << BDRV_SECTOR_BITS;
    int64_t len = iov_size(out_iov, out_num);

    trace_virtio_blk_handle_zone_append(vdev, req, offset >> BDRV_SECTOR_BITS);
    if (!check_zoned_request(s, offset, len, true, &err_status)) {
        goto out;
    }

    data = g_new(ZoneCmdData, 1);
    data->req = req;
    data->in_iov = in_iov;
    data->in_num = in_num;
    data->zone_append_data.offset = offset;
    qemu_iovec_init_external(&req->qiov, out_iov, out_num);

    block_acct_start(blk_get_stats(s->blk), &req->acct, len,
                     BLOCK_ACCT_ZONE_APPEND);

    blk_aio_zone_append(s->blk, &data->zone_append_data.offset, &req->qiov, 0,
                        virtio_blk_zone_append_complete, data);
    return 0;

out:
    virtio_blk_req_complete(req, err_status);
    virtio_blk_free_request(req);
    return err_status;
}

/*
 * Parse one request popped from a virtqueue and dispatch it by type.
 *
 * @req: the request to process
 * @mrb: buffer in which read/write requests are collected for merging
 *
 * The out header is copied into req->out and discarded from the front of the
 * local out_iov; the in header (status byte) is located at the very end of
 * the in buffers and discarded from the back of the local in_iov. Both
 * discards are recorded in req so that they can be undone.
 *
 * Returns 0 when the request was queued, submitted or completed. Returns -1
 * after virtio_error() has been raised for a malformed request; in that case
 * the request has been neither completed nor freed, and callers in this file
 * detach the element and free it.
 */
static int virtio_blk_handle_request(VirtIOBlockReq *req, MultiReqBuffer *mrb)
{
    uint32_t type;
    struct iovec *in_iov = req->elem.in_sg;
    struct iovec *out_iov = req->elem.out_sg;
    unsigned in_num = req->elem.in_num;
    unsigned out_num = req->elem.out_num;
    VirtIOBlock *s = req->dev;
    VirtIODevice *vdev = VIRTIO_DEVICE(s);

    if (req->elem.out_num < 1 || req->elem.in_num < 1) {
        virtio_error(vdev, "virtio-blk missing headers");
        return -1;
    }

    if (unlikely(iov_to_buf(out_iov, out_num, 0, &req->out,
                            sizeof(req->out)) != sizeof(req->out))) {
        virtio_error(vdev, "virtio-blk request outhdr too short");
        return -1;
    }

    iov_discard_front_undoable(&out_iov, &out_num, sizeof(req->out),
                               &req->outhdr_undo);

    if (in_iov[in_num - 1].iov_len < sizeof(struct virtio_blk_inhdr)) {
        virtio_error(vdev, "virtio-blk request inhdr too short");
        iov_discard_undo(&req->outhdr_undo);
        return -1;
    }

    /* We always touch the last byte, so just see how big in_iov is.  */
    req->in_len = iov_size(in_iov, in_num);
    req->in = (void *)in_iov[in_num - 1].iov_base
              + in_iov[in_num - 1].iov_len
              - sizeof(struct virtio_blk_inhdr);
    iov_discard_back_undoable(in_iov, &in_num, sizeof(struct virtio_blk_inhdr),
                              &req->inhdr_undo);

    type = virtio_ldl_p(vdev, &req->out.type);

    /* VIRTIO_BLK_T_OUT defines the command direction. VIRTIO_BLK_T_BARRIER
     * is an optional flag. Although a guest should not send this flag if
     * not negotiated we ignored it in the past. So keep ignoring it. */
    switch (type & ~(VIRTIO_BLK_T_OUT | VIRTIO_BLK_T_BARRIER)) {
    case VIRTIO_BLK_T_IN:
    {
        bool is_write = type & VIRTIO_BLK_T_OUT;
        req->sector_num = virtio_ldq_p(vdev, &req->out.sector);

        if (is_write) {
            qemu_iovec_init_external(&req->qiov, out_iov, out_num);
            trace_virtio_blk_handle_write(vdev, req, req->sector_num,
                                          req->qiov.size / BDRV_SECTOR_SIZE);
        } else {
            qemu_iovec_init_external(&req->qiov, in_iov, in_num);
            trace_virtio_blk_handle_read(vdev, req, req->sector_num,
                                         req->qiov.size / BDRV_SECTOR_SIZE);
        }

        if (!virtio_blk_sect_range_ok(s, req->sector_num, req->qiov.size)) {
            virtio_blk_req_complete(req, VIRTIO_BLK_S_IOERR);
            block_acct_invalid(blk_get_stats(s->blk),
                               is_write ? BLOCK_ACCT_WRITE : BLOCK_ACCT_READ);
            virtio_blk_free_request(req);
            return 0;
        }

        block_acct_start(blk_get_stats(s->blk), &req->acct, req->qiov.size,
                         is_write ? BLOCK_ACCT_WRITE : BLOCK_ACCT_READ);

        /* merge would exceed maximum number of requests or IO direction
         * changes */
        if (mrb->num_reqs > 0 && (mrb->num_reqs == VIRTIO_BLK_MAX_MERGE_REQS ||
                                  is_write != mrb->is_write ||
                                  !s->conf.request_merging)) {
            virtio_blk_submit_multireq(s, mrb);
        }

        assert(mrb->num_reqs < VIRTIO_BLK_MAX_MERGE_REQS);
        mrb->reqs[mrb->num_reqs++] = req;
        mrb->is_write = is_write;
        break;
    }
    case VIRTIO_BLK_T_FLUSH:
        virtio_blk_handle_flush(req, mrb);
        break;
    case VIRTIO_BLK_T_ZONE_REPORT:
        virtio_blk_handle_zone_report(req, in_iov, in_num);
        break;
    case VIRTIO_BLK_T_ZONE_OPEN:
        virtio_blk_handle_zone_mgmt(req, BLK_ZO_OPEN);
        break;
    case VIRTIO_BLK_T_ZONE_CLOSE:
        virtio_blk_handle_zone_mgmt(req, BLK_ZO_CLOSE);
        break;
    case VIRTIO_BLK_T_ZONE_FINISH:
        virtio_blk_handle_zone_mgmt(req, BLK_ZO_FINISH);
        break;
    case VIRTIO_BLK_T_ZONE_RESET:
        virtio_blk_handle_zone_mgmt(req, BLK_ZO_RESET);
        break;
    case VIRTIO_BLK_T_ZONE_RESET_ALL:
        /* The handler reads the request type itself to widen the range. */
        virtio_blk_handle_zone_mgmt(req, BLK_ZO_RESET);
        break;
    case VIRTIO_BLK_T_SCSI_CMD:
        virtio_blk_handle_scsi(req);
        break;
    case VIRTIO_BLK_T_GET_ID:
    {
        /*
         * NB: per existing s/n string convention the string is
         * terminated by '\0' only when shorter than buffer.
         */
        const char *serial = s->conf.serial ? s->conf.serial : "";
        size_t size = MIN(strlen(serial) + 1,
                          MIN(iov_size(in_iov, in_num),
                              VIRTIO_BLK_ID_BYTES));
        iov_from_buf(in_iov, in_num, 0, serial, size);
        virtio_blk_req_complete(req, VIRTIO_BLK_S_OK);
        virtio_blk_free_request(req);
        break;
    }
    case VIRTIO_BLK_T_ZONE_APPEND & ~VIRTIO_BLK_T_OUT:
        /*
         * Pass the local out_iov/out_num and in_iov/in_num instead of
         * letting the handler access req->elem.out_sg/in_sg directly:
         * the local views have already had the request headers discarded
         * by virtio_blk_handle_request() above.
         */
        virtio_blk_handle_zone_append(req, out_iov, in_iov, out_num, in_num);
        break;
    /*
     * VIRTIO_BLK_T_DISCARD and VIRTIO_BLK_T_WRITE_ZEROES are defined with
     * VIRTIO_BLK_T_OUT flag set. We masked this flag in the switch statement,
     * so we must mask it for these requests, then we will check if it is set.
     */
    case VIRTIO_BLK_T_DISCARD & ~VIRTIO_BLK_T_OUT:
    case VIRTIO_BLK_T_WRITE_ZEROES & ~VIRTIO_BLK_T_OUT:
    {
        struct virtio_blk_discard_write_zeroes dwz_hdr;
        size_t out_len = iov_size(out_iov, out_num);
        bool is_write_zeroes = (type & ~VIRTIO_BLK_T_BARRIER) ==
                               VIRTIO_BLK_T_WRITE_ZEROES;
        uint8_t err_status;

        /*
         * Unsupported if VIRTIO_BLK_T_OUT is not set or the request contains
         * more than one segment.
         */
        if (unlikely(!(type & VIRTIO_BLK_T_OUT) ||
                     out_len > sizeof(dwz_hdr))) {
            virtio_blk_req_complete(req, VIRTIO_BLK_S_UNSUPP);
            virtio_blk_free_request(req);
            return 0;
        }

        if (unlikely(iov_to_buf(out_iov, out_num, 0, &dwz_hdr,
                                sizeof(dwz_hdr)) != sizeof(dwz_hdr))) {
            iov_discard_undo(&req->inhdr_undo);
            iov_discard_undo(&req->outhdr_undo);
            virtio_error(vdev, "virtio-blk discard/write_zeroes header"
                         " too short");
            return -1;
        }

        err_status = virtio_blk_handle_discard_write_zeroes(req, &dwz_hdr,
                                                            is_write_zeroes);
        if (err_status != VIRTIO_BLK_S_OK) {
            virtio_blk_req_complete(req, err_status);
            virtio_blk_free_request(req);
        }

        break;
    }
    default:
        virtio_blk_req_complete(req, VIRTIO_BLK_S_UNSUPP);
        virtio_blk_free_request(req);
    }
    return 0;
}

/*
 * Process every request currently available on a virtqueue.
 *
 * @s:  the virtio-blk device
 * @vq: the virtqueue to drain
 *
 * If notifications were enabled on entry, they are switched off while
 * requests are popped and switched back on before the queue is re-checked
 * for emptiness. A request that virtio_blk_handle_request() rejects is
 * detached and freed, and the inner loop stops. Any read/write requests
 * still pending in the merge buffer are submitted at the end.
 */
void virtio_blk_handle_vq(VirtIOBlock *s, VirtQueue *vq)
{
    VirtIOBlockReq *req;
    MultiReqBuffer mrb = {};
    bool suppress_notifications = virtio_queue_get_notification(vq);

    defer_call_begin();

    do {
        if (suppress_notifications) {
            virtio_queue_set_notification(vq, 0);
        }

        while ((req = virtio_blk_get_request(s, vq))) {
            if (virtio_blk_handle_request(req, &mrb)) {
                virtqueue_detach_element(req->vq, &req->elem, 0);
                virtio_blk_free_request(req);
                break;
            }
        }

        if (suppress_notifications) {
            virtio_queue_set_notification(vq, 1);
        }
    } while (!virtio_queue_empty(vq));

    if (mrb.num_reqs) {
        virtio_blk_submit_multireq(s, &mrb);
    }

    defer_call_end();
}

/*
 * Virtqueue output handler.
 *
 * If a dataplane exists but has not been started yet, start it first; unless
 * the dataplane turned out to be disabled, return at that point without
 * processing the queue here. In all other cases the queue is processed
 * directly.
 */
static void virtio_blk_handle_output(VirtIODevice *vdev, VirtQueue *vq)
{
    VirtIOBlock *s = (VirtIOBlock *)vdev;

    if (s->dataplane && !s->dataplane_started) {
        /* Some guests kick before setting VIRTIO_CONFIG_S_DRIVER_OK so start
         * dataplane here instead of waiting for .set_status().
         */
        virtio_device_start_ioeventfd(vdev);
        if (!s->dataplane_disabled) {
            return;
        }
    }

    virtio_blk_handle_vq(s, vq);
}

/*
 * Bottom half that resubmits the requests parked on s->rq.
 *
 * @opaque: the VirtIOBlock
 *
 * The list is detached from the device under rq_lock and then replayed
 * through virtio_blk_handle_request(). If a request is rejected, it and all
 * requests after it are detached and freed.
 */
static void virtio_blk_dma_restart_bh(void *opaque)
{
    VirtIOBlock *s = opaque;

    VirtIOBlockReq *req;
    MultiReqBuffer mrb = {};

    WITH_QEMU_LOCK_GUARD(&s->rq_lock) {
        req = s->rq;
        s->rq = NULL;
    }

    while (req) {
        /* Saved up front: a successfully handled request may be gone. */
        VirtIOBlockReq *next = req->next;
        if (virtio_blk_handle_request(req, &mrb)) {
            /* Device is now broken and won't do any processing until it gets
             * reset. Already queued requests will be lost: let's purge them.
             */
            while (req) {
                next = req->next;
                virtqueue_detach_element(req->vq, &req->elem, 0);
                virtio_blk_free_request(req);
                req = next;
            }
            break;
        }
        req = next;
    }

    if (mrb.num_reqs) {
        virtio_blk_submit_multireq(s, &mrb);
    }

    /* Paired with inc in virtio_blk_dma_restart_cb() */
    blk_dec_in_flight(s->conf.conf.blk);
}

/*
 * VM run-state change callback.
 *
 * @opaque:  the VirtIOBlock
 * @running: true when the VM is entering a running state
 * @state:   the new run state (unused)
 *
 * When the VM starts running, schedule virtio_blk_dma_restart_bh() in the
 * block backend's AioContext.
 */
static void virtio_blk_dma_restart_cb(void *opaque, bool running,
                                      RunState state)
{
    VirtIOBlock *s = opaque;

    if (!running) {
        return;
    }

    /* Paired with dec in virtio_blk_dma_restart_bh() */
    blk_inc_in_flight(s->conf.conf.blk);

    aio_bh_schedule_oneshot(blk_get_aio_context(s->conf.conf.blk),
            virtio_blk_dma_restart_bh, s);
}

/*
 * Device reset: drain in-flight I/O, drop every request still parked on
 * s->rq, and restore the write-cache setting saved in s->original_wce.
 */
static void virtio_blk_reset(VirtIODevice *vdev)
{
    VirtIOBlock *s = VIRTIO_BLK(vdev);
    VirtIOBlockReq *req;

    /* Dataplane has stopped... */
    assert(!s->dataplane_started);

    /* ...but requests may still be in flight. */
    blk_drain(s->blk);

    /* We drop queued requests after blk_drain() because blk_drain() itself can
     * produce them. */
    WITH_QEMU_LOCK_GUARD(&s->rq_lock) {
        while (s->rq) {
            req = s->rq;
            s->rq = req->next;

            /* No other threads can access req->vq here */
            virtqueue_detach_element(req->vq, &req->elem, 0);

            virtio_blk_free_request(req);
        }
    }

    blk_set_enable_write_cache(s->blk, s->original_wce);
}

/*
 * Coalesce internal state and copy it to the device configuration space.
 *
 * @vdev:   the virtio device
 * @config: destination buffer; s->config_size bytes are written
 *
 * The virtio_blk_config is built from the block backend and the device
 * properties. The discard, write-zeroes and zoned fields are filled in only
 * when the corresponding feature or zoned model is present.
 */
static void virtio_blk_update_config(VirtIODevice *vdev, uint8_t *config)
{
    VirtIOBlock *s = VIRTIO_BLK(vdev);
    BlockConf *conf = &s->conf.conf;
    BlockDriverState *bs = blk_bs(s->blk);
    struct virtio_blk_config blkcfg;
    uint64_t capacity;
    int64_t length;
    int blk_size = conf->logical_block_size;

    blk_get_geometry(s->blk, &capacity);
    memset(&blkcfg, 0, sizeof(blkcfg));
    virtio_stq_p(vdev, &blkcfg.capacity, capacity);
    virtio_stl_p(vdev, &blkcfg.seg_max,
                 s->conf.seg_max_adjust ? s->conf.queue_size - 2 : 128 - 2);
    virtio_stw_p(vdev, &blkcfg.geometry.cylinders, conf->cyls);
    virtio_stl_p(vdev, &blkcfg.blk_size, blk_size);
    virtio_stw_p(vdev, &blkcfg.min_io_size, conf->min_io_size / blk_size);
    virtio_stl_p(vdev, &blkcfg.opt_io_size, conf->opt_io_size / blk_size);
    blkcfg.geometry.heads = conf->heads;
    /*
     * We must ensure that the block device capacity is a multiple of
     * the logical block size. If that is not the case, let's use
     * sector_mask to adapt the geometry to have a correct picture.
     * For those devices where the capacity is ok for the given geometry
     * we don't touch the sector value of the geometry, since some devices
     * (like s390 dasd) need a specific value. Here the capacity is already
     * cyls*heads*secs*blk_size and the sector value is not block size
     * divided by 512 - instead it is the amount of blk_size blocks
     * per track (cylinder).
     */
    length = blk_getlength(s->blk);
    if (length > 0 && length / conf->heads / conf->secs % blk_size) {
        blkcfg.geometry.sectors = conf->secs & ~s->sector_mask;
    } else {
        blkcfg.geometry.sectors = conf->secs;
    }
    blkcfg.size_max = 0;
    blkcfg.physical_block_exp = get_physical_block_exp(conf);
    blkcfg.alignment_offset = 0;
    blkcfg.wce = blk_enable_write_cache(s->blk);
    virtio_stw_p(vdev, &blkcfg.num_queues, s->conf.num_queues);
    if (virtio_has_feature(s->host_features, VIRTIO_BLK_F_DISCARD)) {
        uint32_t discard_granularity = conf->discard_granularity;
        if (discard_granularity == -1 || !s->conf.report_discard_granularity) {
            discard_granularity = blk_size;
        }
        virtio_stl_p(vdev, &blkcfg.max_discard_sectors,
                     s->conf.max_discard_sectors);
        virtio_stl_p(vdev, &blkcfg.discard_sector_alignment,
                     discard_granularity >> BDRV_SECTOR_BITS);
        /*
         * We support only one segment per request since multiple segments
         * are not widely used and there are no userspace APIs that allow
         * applications to submit multiple segments in a single call.
         */
        virtio_stl_p(vdev, &blkcfg.max_discard_seg, 1);
    }
    if (virtio_has_feature(s->host_features, VIRTIO_BLK_F_WRITE_ZEROES)) {
        virtio_stl_p(vdev, &blkcfg.max_write_zeroes_sectors,
                     s->conf.max_write_zeroes_sectors);
        blkcfg.write_zeroes_may_unmap = 1;
        virtio_stl_p(vdev, &blkcfg.max_write_zeroes_seg, 1);
    }
    if (bs->bl.zoned != BLK_Z_NONE) {
        switch (bs->bl.zoned) {
        case BLK_Z_HM:
            blkcfg.zoned.model = VIRTIO_BLK_Z_HM;
            break;
        case BLK_Z_HA:
            blkcfg.zoned.model = VIRTIO_BLK_Z_HA;
            break;
        default:
            g_assert_not_reached();
        }

        virtio_stl_p(vdev, &blkcfg.zoned.zone_sectors,
                     bs->bl.zone_size / 512);
        virtio_stl_p(vdev, &blkcfg.zoned.max_active_zones,
                     bs->bl.max_active_zones);
        virtio_stl_p(vdev, &blkcfg.zoned.max_open_zones,
                     bs->bl.max_open_zones);
        virtio_stl_p(vdev, &blkcfg.zoned.write_granularity, blk_size);
        virtio_stl_p(vdev, &blkcfg.zoned.max_append_sectors,
                     bs->bl.max_append_sectors);
    } else {
        blkcfg.zoned.model = VIRTIO_BLK_Z_NONE;
    }
    memcpy(config, &blkcfg, s->config_size);
}

/*
 * Apply a configuration space write from the driver.
 *
 * @vdev:   the virtio device
 * @config: new configuration contents; s->config_size bytes are read
 *
 * Only the wce field is acted on: the backend's write cache is enabled when
 * it is non-zero and disabled otherwise.
 */
static void virtio_blk_set_config(VirtIODevice *vdev, const uint8_t *config)
{
    VirtIOBlock *s = VIRTIO_BLK(vdev);
    struct virtio_blk_config blkcfg;

    memcpy(&blkcfg, config, s->config_size);

    blk_set_enable_write_cache(s->blk, blkcfg.wce != 0);
}

13416e790746SPaolo Bonzini 13429d5b731dSJason Wang static uint64_t virtio_blk_get_features(VirtIODevice *vdev, uint64_t features, 13439d5b731dSJason Wang Error **errp) 13446e790746SPaolo Bonzini { 13456e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 13466e790746SPaolo Bonzini 1347bbe8bd4dSStefano Garzarella /* Firstly sync all virtio-blk possible supported features */ 1348bbe8bd4dSStefano Garzarella features |= s->host_features; 1349bbe8bd4dSStefano Garzarella 13500cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_BLK_F_SEG_MAX); 13510cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_BLK_F_GEOMETRY); 13520cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_BLK_F_TOPOLOGY); 13530cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_BLK_F_BLK_SIZE); 135495129d6fSCornelia Huck if (virtio_has_feature(features, VIRTIO_F_VERSION_1)) { 1355bbe8bd4dSStefano Garzarella if (virtio_has_feature(s->host_features, VIRTIO_BLK_F_SCSI)) { 1356efb8206cSJason Wang error_setg(errp, "Please set scsi=off for virtio-blk devices in order to use virtio 1.0"); 1357efb8206cSJason Wang return 0; 1358efb8206cSJason Wang } 1359efb8206cSJason Wang } else { 1360c9b11f97SJason Wang virtio_clear_feature(&features, VIRTIO_F_ANY_LAYOUT); 1361efb8206cSJason Wang virtio_add_feature(&features, VIRTIO_BLK_F_SCSI); 1362efb8206cSJason Wang } 13636e790746SPaolo Bonzini 13645f258577SEvgeny Yakovlev if (blk_enable_write_cache(s->blk) || 13655f258577SEvgeny Yakovlev (s->conf.x_enable_wce_if_config_wce && 13665f258577SEvgeny Yakovlev virtio_has_feature(features, VIRTIO_BLK_F_CONFIG_WCE))) { 13670cd09c3aSCornelia Huck virtio_add_feature(&features,
VIRTIO_BLK_F_WCE); 13684be74634SMarkus Armbruster } 136986b1cf32SKevin Wolf if (!blk_is_writable(s->blk)) { 13700cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_BLK_F_RO); 13714be74634SMarkus Armbruster } 13722f270590SStefan Hajnoczi if (s->conf.num_queues > 1) { 13732f270590SStefan Hajnoczi virtio_add_feature(&features, VIRTIO_BLK_F_MQ); 13742f270590SStefan Hajnoczi } 13756e790746SPaolo Bonzini 13766e790746SPaolo Bonzini return features; 13776e790746SPaolo Bonzini } 13786e790746SPaolo Bonzini 13796e790746SPaolo Bonzini static void virtio_blk_set_status(VirtIODevice *vdev, uint8_t status) 13806e790746SPaolo Bonzini { 13816e790746SPaolo Bonzini VirtIOBlock *s = VIRTIO_BLK(vdev); 13826e790746SPaolo Bonzini 13839ffe337cSPaolo Bonzini if (!(status & (VIRTIO_CONFIG_S_DRIVER | VIRTIO_CONFIG_S_DRIVER_OK))) { 13849ffe337cSPaolo Bonzini assert(!s->dataplane_started); 13856e790746SPaolo Bonzini } 13866e790746SPaolo Bonzini 13876e790746SPaolo Bonzini if (!(status & VIRTIO_CONFIG_S_DRIVER_OK)) { 13886e790746SPaolo Bonzini return; 13896e790746SPaolo Bonzini } 13906e790746SPaolo Bonzini 1391ef5bc962SPaolo Bonzini /* A guest that supports VIRTIO_BLK_F_CONFIG_WCE must be able to send 1392ef5bc962SPaolo Bonzini * cache flushes. Thus, the "auto writethrough" behavior is never 1393ef5bc962SPaolo Bonzini * necessary for guests that support the VIRTIO_BLK_F_CONFIG_WCE feature. 
1394ef5bc962SPaolo Bonzini * Leaving it enabled would break the following sequence: 1395ef5bc962SPaolo Bonzini * 1396ef5bc962SPaolo Bonzini * Guest started with "-drive cache=writethrough" 1397ef5bc962SPaolo Bonzini * Guest sets status to 0 1398ef5bc962SPaolo Bonzini * Guest sets DRIVER bit in status field 1399ef5bc962SPaolo Bonzini * Guest reads host features (WCE=0, CONFIG_WCE=1) 1400ef5bc962SPaolo Bonzini * Guest writes guest features (WCE=0, CONFIG_WCE=1) 1401ef5bc962SPaolo Bonzini * Guest writes 1 to the WCE configuration field (writeback mode) 1402ef5bc962SPaolo Bonzini * Guest sets DRIVER_OK bit in status field 1403ef5bc962SPaolo Bonzini * 14044be74634SMarkus Armbruster * s->blk would erroneously be placed in writethrough mode. 1405ef5bc962SPaolo Bonzini */ 140695129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_BLK_F_CONFIG_WCE)) { 14074be74634SMarkus Armbruster blk_set_enable_write_cache(s->blk, 140895129d6fSCornelia Huck virtio_vdev_has_feature(vdev, 140995129d6fSCornelia Huck VIRTIO_BLK_F_WCE)); 14106e790746SPaolo Bonzini } 1411ef5bc962SPaolo Bonzini } 14126e790746SPaolo Bonzini 1413b2b295a7SGreg Kurz static void virtio_blk_save_device(VirtIODevice *vdev, QEMUFile *f) 1414b2b295a7SGreg Kurz { 1415b2b295a7SGreg Kurz VirtIOBlock *s = VIRTIO_BLK(vdev); 14169c67f33fSStefan Hajnoczi 14179c67f33fSStefan Hajnoczi WITH_QEMU_LOCK_GUARD(&s->rq_lock) { 1418b2b295a7SGreg Kurz VirtIOBlockReq *req = s->rq; 14196e790746SPaolo Bonzini 14206e790746SPaolo Bonzini while (req) { 14216e790746SPaolo Bonzini qemu_put_sbyte(f, 1); 142230d8bf6dSStefan Hajnoczi 142330d8bf6dSStefan Hajnoczi if (s->conf.num_queues > 1) { 142430d8bf6dSStefan Hajnoczi qemu_put_be32(f, virtio_get_queue_index(req->vq)); 142530d8bf6dSStefan Hajnoczi } 142630d8bf6dSStefan Hajnoczi 142786044b24SJason Wang qemu_put_virtqueue_element(vdev, f, &req->elem); 14286e790746SPaolo Bonzini req = req->next; 14296e790746SPaolo Bonzini } 14309c67f33fSStefan Hajnoczi } 14319c67f33fSStefan Hajnoczi 
14326e790746SPaolo Bonzini qemu_put_sbyte(f, 0); 14336e790746SPaolo Bonzini } 14346e790746SPaolo Bonzini 1435b2b295a7SGreg Kurz static int virtio_blk_load_device(VirtIODevice *vdev, QEMUFile *f, 1436b2b295a7SGreg Kurz int version_id) 1437b2b295a7SGreg Kurz { 1438b2b295a7SGreg Kurz VirtIOBlock *s = VIRTIO_BLK(vdev); 1439b2b295a7SGreg Kurz 14406e790746SPaolo Bonzini while (qemu_get_sbyte(f)) { 144130d8bf6dSStefan Hajnoczi unsigned nvqs = s->conf.num_queues; 144230d8bf6dSStefan Hajnoczi unsigned vq_idx = 0; 1443ab281c17SPaolo Bonzini VirtIOBlockReq *req; 144430d8bf6dSStefan Hajnoczi 144530d8bf6dSStefan Hajnoczi if (nvqs > 1) { 144630d8bf6dSStefan Hajnoczi vq_idx = qemu_get_be32(f); 144730d8bf6dSStefan Hajnoczi 144830d8bf6dSStefan Hajnoczi if (vq_idx >= nvqs) { 144930d8bf6dSStefan Hajnoczi error_report("Invalid virtqueue index in request list: %#x", 145030d8bf6dSStefan Hajnoczi vq_idx); 145130d8bf6dSStefan Hajnoczi return -EINVAL; 145230d8bf6dSStefan Hajnoczi } 145330d8bf6dSStefan Hajnoczi } 145430d8bf6dSStefan Hajnoczi 14558607f5c3SJason Wang req = qemu_get_virtqueue_element(vdev, f, sizeof(VirtIOBlockReq)); 145630d8bf6dSStefan Hajnoczi virtio_blk_init_request(s, virtio_get_queue(vdev, vq_idx), req); 14579c67f33fSStefan Hajnoczi 14589c67f33fSStefan Hajnoczi WITH_QEMU_LOCK_GUARD(&s->rq_lock) { 14596e790746SPaolo Bonzini req->next = s->rq; 14606e790746SPaolo Bonzini s->rq = req; 14616e790746SPaolo Bonzini } 14629c67f33fSStefan Hajnoczi } 14636e790746SPaolo Bonzini 14646e790746SPaolo Bonzini return 0; 14656e790746SPaolo Bonzini } 14666e790746SPaolo Bonzini 1467b6948ab0SStefan Hajnoczi static bool 1468b6948ab0SStefan Hajnoczi validate_iothread_vq_mapping_list(IOThreadVirtQueueMappingList *list, 1469b6948ab0SStefan Hajnoczi uint16_t num_queues, Error **errp) 1470b6948ab0SStefan Hajnoczi { 1471b6948ab0SStefan Hajnoczi g_autofree unsigned long *vqs = bitmap_new(num_queues); 1472b6948ab0SStefan Hajnoczi g_autoptr(GHashTable) iothreads = 1473b6948ab0SStefan Hajnoczi 
g_hash_table_new(g_str_hash, g_str_equal); 1474b6948ab0SStefan Hajnoczi 1475b6948ab0SStefan Hajnoczi for (IOThreadVirtQueueMappingList *node = list; node; node = node->next) { 1476b6948ab0SStefan Hajnoczi const char *name = node->value->iothread; 1477b6948ab0SStefan Hajnoczi uint16List *vq; 1478b6948ab0SStefan Hajnoczi 1479b6948ab0SStefan Hajnoczi if (!iothread_by_id(name)) { 1480b6948ab0SStefan Hajnoczi error_setg(errp, "IOThread \"%s\" object does not exist", name); 1481b6948ab0SStefan Hajnoczi return false; 1482b6948ab0SStefan Hajnoczi } 1483b6948ab0SStefan Hajnoczi 1484b6948ab0SStefan Hajnoczi if (!g_hash_table_add(iothreads, (gpointer)name)) { 1485b6948ab0SStefan Hajnoczi error_setg(errp, 1486b6948ab0SStefan Hajnoczi "duplicate IOThread name \"%s\" in iothread-vq-mapping", 1487b6948ab0SStefan Hajnoczi name); 1488b6948ab0SStefan Hajnoczi return false; 1489b6948ab0SStefan Hajnoczi } 1490b6948ab0SStefan Hajnoczi 1491b6948ab0SStefan Hajnoczi if (node != list) { 1492b6948ab0SStefan Hajnoczi if (!!node->value->vqs != !!list->value->vqs) { 1493b6948ab0SStefan Hajnoczi error_setg(errp, "either all items in iothread-vq-mapping " 1494b6948ab0SStefan Hajnoczi "must have vqs or none of them must have it"); 1495b6948ab0SStefan Hajnoczi return false; 1496b6948ab0SStefan Hajnoczi } 1497b6948ab0SStefan Hajnoczi } 1498b6948ab0SStefan Hajnoczi 1499b6948ab0SStefan Hajnoczi for (vq = node->value->vqs; vq; vq = vq->next) { 1500b6948ab0SStefan Hajnoczi if (vq->value >= num_queues) { 1501b6948ab0SStefan Hajnoczi error_setg(errp, "vq index %u for IOThread \"%s\" must be " 1502b6948ab0SStefan Hajnoczi "less than num_queues %u in iothread-vq-mapping", 1503b6948ab0SStefan Hajnoczi vq->value, name, num_queues); 1504b6948ab0SStefan Hajnoczi return false; 1505b6948ab0SStefan Hajnoczi } 1506b6948ab0SStefan Hajnoczi 1507b6948ab0SStefan Hajnoczi if (test_and_set_bit(vq->value, vqs)) { 1508b6948ab0SStefan Hajnoczi error_setg(errp, "cannot assign vq %u to IOThread \"%s\" " 1509b6948ab0SStefan 
Hajnoczi "because it is already assigned", vq->value, name); 1510b6948ab0SStefan Hajnoczi return false; 1511b6948ab0SStefan Hajnoczi } 1512b6948ab0SStefan Hajnoczi } 1513b6948ab0SStefan Hajnoczi } 1514b6948ab0SStefan Hajnoczi 1515b6948ab0SStefan Hajnoczi if (list->value->vqs) { 1516b6948ab0SStefan Hajnoczi for (uint16_t i = 0; i < num_queues; i++) { 1517b6948ab0SStefan Hajnoczi if (!test_bit(i, vqs)) { 1518b6948ab0SStefan Hajnoczi error_setg(errp, 1519b6948ab0SStefan Hajnoczi "missing vq %u IOThread assignment in iothread-vq-mapping", 1520b6948ab0SStefan Hajnoczi i); 1521b6948ab0SStefan Hajnoczi return false; 1522b6948ab0SStefan Hajnoczi } 1523b6948ab0SStefan Hajnoczi } 1524b6948ab0SStefan Hajnoczi } 1525b6948ab0SStefan Hajnoczi 1526b6948ab0SStefan Hajnoczi return true; 1527b6948ab0SStefan Hajnoczi } 1528b6948ab0SStefan Hajnoczi 15299b92fbcfSSergio Lopez static void virtio_resize_cb(void *opaque) 15309b92fbcfSSergio Lopez { 15319b92fbcfSSergio Lopez VirtIODevice *vdev = opaque; 15329b92fbcfSSergio Lopez 15339b92fbcfSSergio Lopez assert(qemu_get_current_aio_context() == qemu_get_aio_context()); 15349b92fbcfSSergio Lopez virtio_notify_config(vdev); 15359b92fbcfSSergio Lopez } 15369b92fbcfSSergio Lopez 15376e790746SPaolo Bonzini static void virtio_blk_resize(void *opaque) 15386e790746SPaolo Bonzini { 15396e790746SPaolo Bonzini VirtIODevice *vdev = VIRTIO_DEVICE(opaque); 15406e790746SPaolo Bonzini 15419b92fbcfSSergio Lopez /* 15429b92fbcfSSergio Lopez * virtio_notify_config() needs to acquire the global mutex, 15439b92fbcfSSergio Lopez * so it can't be called from an iothread. Instead, schedule 15449b92fbcfSSergio Lopez * it to be run in the main context BH. 
15459b92fbcfSSergio Lopez */ 15469b92fbcfSSergio Lopez aio_bh_schedule_oneshot(qemu_get_aio_context(), virtio_resize_cb, vdev); 15476e790746SPaolo Bonzini } 15486e790746SPaolo Bonzini 15491665d932SStefan Hajnoczi /* Suspend virtqueue ioeventfd processing during drain */ 15501665d932SStefan Hajnoczi static void virtio_blk_drained_begin(void *opaque) 15511665d932SStefan Hajnoczi { 15521665d932SStefan Hajnoczi VirtIOBlock *s = opaque; 15531665d932SStefan Hajnoczi 15541665d932SStefan Hajnoczi if (!s->dataplane || !s->dataplane_started) { 15551665d932SStefan Hajnoczi return; 15561665d932SStefan Hajnoczi } 15571665d932SStefan Hajnoczi 1558b6948ab0SStefan Hajnoczi virtio_blk_data_plane_detach(s->dataplane); 15591665d932SStefan Hajnoczi } 15601665d932SStefan Hajnoczi 15611665d932SStefan Hajnoczi /* Resume virtqueue ioeventfd processing after drain */ 15621665d932SStefan Hajnoczi static void virtio_blk_drained_end(void *opaque) 15631665d932SStefan Hajnoczi { 15641665d932SStefan Hajnoczi VirtIOBlock *s = opaque; 15651665d932SStefan Hajnoczi 15661665d932SStefan Hajnoczi if (!s->dataplane || !s->dataplane_started) { 15671665d932SStefan Hajnoczi return; 15681665d932SStefan Hajnoczi } 15691665d932SStefan Hajnoczi 1570b6948ab0SStefan Hajnoczi virtio_blk_data_plane_attach(s->dataplane); 15711665d932SStefan Hajnoczi } 15721665d932SStefan Hajnoczi 15736e790746SPaolo Bonzini static const BlockDevOps virtio_block_ops = { 15746e790746SPaolo Bonzini .resize_cb = virtio_blk_resize, 15751665d932SStefan Hajnoczi .drained_begin = virtio_blk_drained_begin, 15761665d932SStefan Hajnoczi .drained_end = virtio_blk_drained_end, 15776e790746SPaolo Bonzini }; 15786e790746SPaolo Bonzini 157975884afdSAndreas Färber static void virtio_blk_device_realize(DeviceState *dev, Error **errp) 15806e790746SPaolo Bonzini { 158175884afdSAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 1582179b417eSAndreas Färber VirtIOBlock *s = VIRTIO_BLK(dev); 15832a30307fSMarkus Armbruster VirtIOBlkConf *conf = 
&s->conf; 15843ffeeef7SAndreas Färber Error *err = NULL; 15852f270590SStefan Hajnoczi unsigned i; 15866e790746SPaolo Bonzini 15874be74634SMarkus Armbruster if (!conf->conf.blk) { 158875884afdSAndreas Färber error_setg(errp, "drive property not set"); 158975884afdSAndreas Färber return; 15906e790746SPaolo Bonzini } 15914be74634SMarkus Armbruster if (!blk_is_inserted(conf->conf.blk)) { 159275884afdSAndreas Färber error_setg(errp, "Device needs media, but drive is empty"); 159375884afdSAndreas Färber return; 15946e790746SPaolo Bonzini } 15959445e1e1SStefan Hajnoczi if (conf->num_queues == VIRTIO_BLK_AUTO_NUM_QUEUES) { 15969445e1e1SStefan Hajnoczi conf->num_queues = 1; 15979445e1e1SStefan Hajnoczi } 15982f270590SStefan Hajnoczi if (!conf->num_queues) { 15992f270590SStefan Hajnoczi error_setg(errp, "num-queues property must be larger than 0"); 16002f270590SStefan Hajnoczi return; 16012f270590SStefan Hajnoczi } 16021bf8a989SDenis Plotnikov if (conf->queue_size <= 2) { 16031bf8a989SDenis Plotnikov error_setg(errp, "invalid queue-size property (%" PRIu16 "), " 16041bf8a989SDenis Plotnikov "must be > 2", conf->queue_size); 16051bf8a989SDenis Plotnikov return; 16061bf8a989SDenis Plotnikov } 16076040aeddSMark Kanda if (!is_power_of_2(conf->queue_size) || 16086040aeddSMark Kanda conf->queue_size > VIRTQUEUE_MAX_SIZE) { 16096040aeddSMark Kanda error_setg(errp, "invalid queue-size property (%" PRIu16 "), " 16106040aeddSMark Kanda "must be a power of 2 (max %d)", 16116040aeddSMark Kanda conf->queue_size, VIRTQUEUE_MAX_SIZE); 16126040aeddSMark Kanda return; 16136040aeddSMark Kanda } 16146e790746SPaolo Bonzini 1615ceff3e1fSMao Zhongyi if (!blkconf_apply_backend_options(&conf->conf, 161686b1cf32SKevin Wolf !blk_supports_write_perm(conf->conf.blk), 161786b1cf32SKevin Wolf true, errp)) { 1618a17c17a2SKevin Wolf return; 1619a17c17a2SKevin Wolf } 16204be74634SMarkus Armbruster s->original_wce = blk_enable_write_cache(conf->conf.blk); 1621ceff3e1fSMao Zhongyi if 
(!blkconf_geometry(&conf->conf, NULL, 65535, 255, 255, errp)) { 162275884afdSAndreas Färber return; 16236e790746SPaolo Bonzini } 1624ceff3e1fSMao Zhongyi 1625c56ee92fSRoman Kagan if (!blkconf_blocksizes(&conf->conf, errp)) { 16260a75b60cSMark Kanda return; 16270a75b60cSMark Kanda } 16280a75b60cSMark Kanda 16294f736650SSam Li BlockDriverState *bs = blk_bs(conf->conf.blk); 16304f736650SSam Li if (bs->bl.zoned != BLK_Z_NONE) { 16314f736650SSam Li virtio_add_feature(&s->host_features, VIRTIO_BLK_F_ZONED); 16324f736650SSam Li if (bs->bl.zoned == BLK_Z_HM) { 16334f736650SSam Li virtio_clear_feature(&s->host_features, VIRTIO_BLK_F_DISCARD); 16344f736650SSam Li } 16354f736650SSam Li } 16364f736650SSam Li 163737b06f8dSStefano Garzarella if (virtio_has_feature(s->host_features, VIRTIO_BLK_F_DISCARD) && 163837b06f8dSStefano Garzarella (!conf->max_discard_sectors || 163937b06f8dSStefano Garzarella conf->max_discard_sectors > BDRV_REQUEST_MAX_SECTORS)) { 164037b06f8dSStefano Garzarella error_setg(errp, "invalid max-discard-sectors property (%" PRIu32 ")" 164137b06f8dSStefano Garzarella ", must be between 1 and %d", 164237b06f8dSStefano Garzarella conf->max_discard_sectors, (int)BDRV_REQUEST_MAX_SECTORS); 164337b06f8dSStefano Garzarella return; 164437b06f8dSStefano Garzarella } 164537b06f8dSStefano Garzarella 164637b06f8dSStefano Garzarella if (virtio_has_feature(s->host_features, VIRTIO_BLK_F_WRITE_ZEROES) && 164737b06f8dSStefano Garzarella (!conf->max_write_zeroes_sectors || 164837b06f8dSStefano Garzarella conf->max_write_zeroes_sectors > BDRV_REQUEST_MAX_SECTORS)) { 164937b06f8dSStefano Garzarella error_setg(errp, "invalid max-write-zeroes-sectors property (%" PRIu32 165037b06f8dSStefano Garzarella "), must be between 1 and %d", 165137b06f8dSStefano Garzarella conf->max_write_zeroes_sectors, 165237b06f8dSStefano Garzarella (int)BDRV_REQUEST_MAX_SECTORS); 165337b06f8dSStefano Garzarella return; 165437b06f8dSStefano Garzarella } 165537b06f8dSStefano Garzarella 
1656b6948ab0SStefan Hajnoczi if (conf->iothread_vq_mapping_list) { 1657b6948ab0SStefan Hajnoczi if (conf->iothread) { 1658b6948ab0SStefan Hajnoczi error_setg(errp, "iothread and iothread-vq-mapping properties " 1659b6948ab0SStefan Hajnoczi "cannot be set at the same time"); 1660b6948ab0SStefan Hajnoczi return; 1661b6948ab0SStefan Hajnoczi } 1662b6948ab0SStefan Hajnoczi 1663b6948ab0SStefan Hajnoczi if (!validate_iothread_vq_mapping_list(conf->iothread_vq_mapping_list, 1664b6948ab0SStefan Hajnoczi conf->num_queues, errp)) { 1665b6948ab0SStefan Hajnoczi return; 1666b6948ab0SStefan Hajnoczi } 1667b6948ab0SStefan Hajnoczi } 1668b6948ab0SStefan Hajnoczi 1669d9cf55a8SDaniil Tatianin s->config_size = virtio_get_config_size(&virtio_blk_cfg_size_params, 1670d74c30c8SDaniil Tatianin s->host_features); 16713857cd5cSJonah Palmer virtio_init(vdev, VIRTIO_ID_BLOCK, s->config_size); 16726e790746SPaolo Bonzini 16739c67f33fSStefan Hajnoczi qemu_mutex_init(&s->rq_lock); 16749c67f33fSStefan Hajnoczi 16754be74634SMarkus Armbruster s->blk = conf->conf.blk; 16766e790746SPaolo Bonzini s->rq = NULL; 16772a30307fSMarkus Armbruster s->sector_mask = (s->conf.conf.logical_block_size / BDRV_SECTOR_SIZE) - 1; 16786e790746SPaolo Bonzini 16792f270590SStefan Hajnoczi for (i = 0; i < conf->num_queues; i++) { 16806040aeddSMark Kanda virtio_add_queue(vdev, conf->queue_size, virtio_blk_handle_output); 16812f270590SStefan Hajnoczi } 168298e3ab35SKevin Wolf qemu_coroutine_inc_pool_size(conf->num_queues * conf->queue_size / 2); 16832a30307fSMarkus Armbruster virtio_blk_data_plane_create(vdev, conf, &s->dataplane, &err); 16843ffeeef7SAndreas Färber if (err != NULL) { 168575884afdSAndreas Färber error_propagate(errp, err); 1686cfaf757eSPan Nengyuan for (i = 0; i < conf->num_queues; i++) { 1687cfaf757eSPan Nengyuan virtio_del_queue(vdev, i); 1688cfaf757eSPan Nengyuan } 16896a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 169075884afdSAndreas Färber return; 16916e790746SPaolo Bonzini } 16926e790746SPaolo 
Bonzini 1693a937f8e8SStefan Hajnoczi /* 1694a937f8e8SStefan Hajnoczi * This must be after virtio_init() so virtio_blk_dma_restart_cb() gets 1695a937f8e8SStefan Hajnoczi * called after ->start_ioeventfd() has already set blk's AioContext. 1696a937f8e8SStefan Hajnoczi */ 1697a937f8e8SStefan Hajnoczi s->change = 1698a937f8e8SStefan Hajnoczi qdev_add_vm_change_state_handler(dev, virtio_blk_dma_restart_cb, s); 1699a937f8e8SStefan Hajnoczi 1700baf42268SStefan Hajnoczi blk_ram_registrar_init(&s->blk_ram_registrar, s->blk); 17014be74634SMarkus Armbruster blk_set_dev_ops(s->blk, &virtio_block_ops, s); 17026e790746SPaolo Bonzini 17034be74634SMarkus Armbruster blk_iostatus_enable(s->blk); 170471f571a2SSam Eiderman 170571f571a2SSam Eiderman add_boot_device_lchs(dev, "/disk@0,0", 170671f571a2SSam Eiderman conf->conf.lcyls, 170771f571a2SSam Eiderman conf->conf.lheads, 170871f571a2SSam Eiderman conf->conf.lsecs); 17096e790746SPaolo Bonzini } 17106e790746SPaolo Bonzini 1711b69c3c21SMarkus Armbruster static void virtio_blk_device_unrealize(DeviceState *dev) 17126e790746SPaolo Bonzini { 1713306ec6c3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 1714306ec6c3SAndreas Färber VirtIOBlock *s = VIRTIO_BLK(dev); 17154a0117cfSEugenio Pérez VirtIOBlkConf *conf = &s->conf; 17164a0117cfSEugenio Pérez unsigned i; 1717306ec6c3SAndreas Färber 17187bfde688SJulia Suvorova blk_drain(s->blk); 171971f571a2SSam Eiderman del_boot_device_lchs(dev, "/disk@0,0"); 17206e790746SPaolo Bonzini virtio_blk_data_plane_destroy(s->dataplane); 17216e790746SPaolo Bonzini s->dataplane = NULL; 17224a0117cfSEugenio Pérez for (i = 0; i < conf->num_queues; i++) { 17234a0117cfSEugenio Pérez virtio_del_queue(vdev, i); 17244a0117cfSEugenio Pérez } 172598e3ab35SKevin Wolf qemu_coroutine_dec_pool_size(conf->num_queues * conf->queue_size / 2); 17269c67f33fSStefan Hajnoczi qemu_mutex_destroy(&s->rq_lock); 1727baf42268SStefan Hajnoczi blk_ram_registrar_destroy(&s->blk_ram_registrar); 17286e790746SPaolo Bonzini 
qemu_del_vm_change_state_handler(s->change); 17294be74634SMarkus Armbruster blockdev_mark_auto_del(s->blk); 17306a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 17316e790746SPaolo Bonzini } 17326e790746SPaolo Bonzini 1733467b3f33SStefan Hajnoczi static void virtio_blk_instance_init(Object *obj) 1734467b3f33SStefan Hajnoczi { 1735467b3f33SStefan Hajnoczi VirtIOBlock *s = VIRTIO_BLK(obj); 1736467b3f33SStefan Hajnoczi 17372a30307fSMarkus Armbruster device_add_bootindex_property(obj, &s->conf.conf.bootindex, 17383342ec32SGonglei "bootindex", "/disk@0,0", 173940c2281cSMarkus Armbruster DEVICE(obj)); 1740467b3f33SStefan Hajnoczi } 1741467b3f33SStefan Hajnoczi 1742977a117fSHalil Pasic static const VMStateDescription vmstate_virtio_blk = { 1743977a117fSHalil Pasic .name = "virtio-blk", 1744977a117fSHalil Pasic .minimum_version_id = 2, 1745977a117fSHalil Pasic .version_id = 2, 1746*7d5dc0a3SRichard Henderson .fields = (const VMStateField[]) { 1747977a117fSHalil Pasic VMSTATE_VIRTIO_DEVICE, 1748977a117fSHalil Pasic VMSTATE_END_OF_LIST() 1749977a117fSHalil Pasic }, 1750977a117fSHalil Pasic }; 1751bbded32cSDr. 
David Alan Gilbert 17526e790746SPaolo Bonzini static Property virtio_blk_properties[] = { 17532a30307fSMarkus Armbruster DEFINE_BLOCK_PROPERTIES(VirtIOBlock, conf.conf), 17548c398252SKevin Wolf DEFINE_BLOCK_ERROR_PROPERTIES(VirtIOBlock, conf.conf), 17552a30307fSMarkus Armbruster DEFINE_BLOCK_CHS_PROPERTIES(VirtIOBlock, conf.conf), 17562a30307fSMarkus Armbruster DEFINE_PROP_STRING("serial", VirtIOBlock, conf.serial), 1757bbe8bd4dSStefano Garzarella DEFINE_PROP_BIT64("config-wce", VirtIOBlock, host_features, 1758bbe8bd4dSStefano Garzarella VIRTIO_BLK_F_CONFIG_WCE, true), 175932a877e4SStefan Hajnoczi #ifdef __linux__ 1760bbe8bd4dSStefano Garzarella DEFINE_PROP_BIT64("scsi", VirtIOBlock, host_features, 1761bbe8bd4dSStefano Garzarella VIRTIO_BLK_F_SCSI, false), 176232a877e4SStefan Hajnoczi #endif 1763c99495acSPeter Lieven DEFINE_PROP_BIT("request-merging", VirtIOBlock, conf.request_merging, 0, 1764c99495acSPeter Lieven true), 17659445e1e1SStefan Hajnoczi DEFINE_PROP_UINT16("num-queues", VirtIOBlock, conf.num_queues, 17669445e1e1SStefan Hajnoczi VIRTIO_BLK_AUTO_NUM_QUEUES), 1767c9b7d9ecSDenis Plotnikov DEFINE_PROP_UINT16("queue-size", VirtIOBlock, conf.queue_size, 256), 17681bf8a989SDenis Plotnikov DEFINE_PROP_BOOL("seg-max-adjust", VirtIOBlock, conf.seg_max_adjust, true), 1769d679ac09SFam Zheng DEFINE_PROP_LINK("iothread", VirtIOBlock, conf.iothread, TYPE_IOTHREAD, 1770d679ac09SFam Zheng IOThread *), 1771b6948ab0SStefan Hajnoczi DEFINE_PROP_IOTHREAD_VQ_MAPPING_LIST("iothread-vq-mapping", VirtIOBlock, 1772b6948ab0SStefan Hajnoczi conf.iothread_vq_mapping_list), 17735c81161fSStefano Garzarella DEFINE_PROP_BIT64("discard", VirtIOBlock, host_features, 17745c81161fSStefano Garzarella VIRTIO_BLK_F_DISCARD, true), 1775fb0b154cSAkihiko Odaki DEFINE_PROP_BOOL("report-discard-granularity", VirtIOBlock, 1776fb0b154cSAkihiko Odaki conf.report_discard_granularity, true), 17775c81161fSStefano Garzarella DEFINE_PROP_BIT64("write-zeroes", VirtIOBlock, host_features, 
17785c81161fSStefano Garzarella VIRTIO_BLK_F_WRITE_ZEROES, true), 177937b06f8dSStefano Garzarella DEFINE_PROP_UINT32("max-discard-sectors", VirtIOBlock, 178037b06f8dSStefano Garzarella conf.max_discard_sectors, BDRV_REQUEST_MAX_SECTORS), 178137b06f8dSStefano Garzarella DEFINE_PROP_UINT32("max-write-zeroes-sectors", VirtIOBlock, 178237b06f8dSStefano Garzarella conf.max_write_zeroes_sectors, BDRV_REQUEST_MAX_SECTORS), 17835f258577SEvgeny Yakovlev DEFINE_PROP_BOOL("x-enable-wce-if-config-wce", VirtIOBlock, 17845f258577SEvgeny Yakovlev conf.x_enable_wce_if_config_wce, true), 17856e790746SPaolo Bonzini DEFINE_PROP_END_OF_LIST(), 17866e790746SPaolo Bonzini }; 17876e790746SPaolo Bonzini 17886e790746SPaolo Bonzini static void virtio_blk_class_init(ObjectClass *klass, void *data) 17896e790746SPaolo Bonzini { 17906e790746SPaolo Bonzini DeviceClass *dc = DEVICE_CLASS(klass); 17916e790746SPaolo Bonzini VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass); 179275884afdSAndreas Färber 17934f67d30bSMarc-André Lureau device_class_set_props(dc, virtio_blk_properties); 1794bbded32cSDr. 
David Alan Gilbert dc->vmsd = &vmstate_virtio_blk; 1795125ee0edSMarcel Apfelbaum set_bit(DEVICE_CATEGORY_STORAGE, dc->categories); 179675884afdSAndreas Färber vdc->realize = virtio_blk_device_realize; 1797306ec6c3SAndreas Färber vdc->unrealize = virtio_blk_device_unrealize; 17986e790746SPaolo Bonzini vdc->get_config = virtio_blk_update_config; 17996e790746SPaolo Bonzini vdc->set_config = virtio_blk_set_config; 18006e790746SPaolo Bonzini vdc->get_features = virtio_blk_get_features; 18016e790746SPaolo Bonzini vdc->set_status = virtio_blk_set_status; 18026e790746SPaolo Bonzini vdc->reset = virtio_blk_reset; 1803b2b295a7SGreg Kurz vdc->save = virtio_blk_save_device; 1804b2b295a7SGreg Kurz vdc->load = virtio_blk_load_device; 18059ffe337cSPaolo Bonzini vdc->start_ioeventfd = virtio_blk_data_plane_start; 18069ffe337cSPaolo Bonzini vdc->stop_ioeventfd = virtio_blk_data_plane_stop; 18076e790746SPaolo Bonzini } 18086e790746SPaolo Bonzini 1809b5c7ceafSChanglong Xie static const TypeInfo virtio_blk_info = { 18106e790746SPaolo Bonzini .name = TYPE_VIRTIO_BLK, 18116e790746SPaolo Bonzini .parent = TYPE_VIRTIO_DEVICE, 18126e790746SPaolo Bonzini .instance_size = sizeof(VirtIOBlock), 1813467b3f33SStefan Hajnoczi .instance_init = virtio_blk_instance_init, 18146e790746SPaolo Bonzini .class_init = virtio_blk_class_init, 18156e790746SPaolo Bonzini }; 18166e790746SPaolo Bonzini 18176e790746SPaolo Bonzini static void virtio_register_types(void) 18186e790746SPaolo Bonzini { 1819b5c7ceafSChanglong Xie type_register_static(&virtio_blk_info); 18206e790746SPaolo Bonzini } 18216e790746SPaolo Bonzini 18226e790746SPaolo Bonzini type_init(virtio_register_types) 1823