1 /*
2 * Dedicated thread for virtio-blk I/O processing
3 *
4 * Copyright 2012 IBM, Corp.
5 * Copyright 2012 Red Hat, Inc. and/or its affiliates
6 *
7 * Authors:
8 * Stefan Hajnoczi <stefanha@redhat.com>
9 *
10 * This work is licensed under the terms of the GNU GPL, version 2 or later.
11 * See the COPYING file in the top-level directory.
12 *
13 */
14
15 #include "qemu/osdep.h"
16 #include "qapi/error.h"
17 #include "trace.h"
18 #include "qemu/iov.h"
19 #include "qemu/main-loop.h"
20 #include "qemu/thread.h"
21 #include "qemu/error-report.h"
22 #include "hw/virtio/virtio-access.h"
23 #include "hw/virtio/virtio-blk.h"
24 #include "virtio-blk.h"
25 #include "block/aio.h"
26 #include "hw/virtio/virtio-bus.h"
27 #include "qom/object_interfaces.h"
28
/*
 * Per-device state used while a virtio-blk device runs in dataplane mode.
 * Allocated by virtio_blk_data_plane_create() and released by
 * virtio_blk_data_plane_destroy().
 */
struct VirtIOBlockDataPlane {
    /* Re-entrancy guard checked on entry to virtio_blk_data_plane_start() */
    bool starting;
    /* Re-entrancy guard checked on entry to virtio_blk_data_plane_stop() */
    bool stopping;

    /* Device configuration (num_queues, iothread, block backend) */
    VirtIOBlkConf *conf;
    /* The virtio device this dataplane belongs to */
    VirtIODevice *vdev;
    QEMUBH *bh; /* bh for guest notification */
    /* Bitmap of virtqueue indexes awaiting a batched guest notification */
    unsigned long *batch_notify_vqs;
    /*
     * When true, notifications are deferred to the bh; set in
     * virtio_blk_data_plane_start() when the device lacks
     * VIRTIO_RING_F_EVENT_IDX.
     */
    bool batch_notifications;

    /* Note that these EventNotifiers are assigned by value. This is
     * fine as long as you do not call event_notifier_cleanup on them
     * (because you don't own the file descriptor or handle; you just
     * use it).
     *
     * NOTE(review): no EventNotifier member is declared in this struct,
     * so the remark above looks stale -- confirm before relying on it.
     */
    /* Referenced IOThread, or NULL when conf->iothread is not set */
    IOThread *iothread;
    /* AioContext of the IOThread, or the main loop context otherwise */
    AioContext *ctx;
};
47
48 /* Raise an interrupt to signal guest, if necessary */
virtio_blk_data_plane_notify(VirtIOBlockDataPlane * s,VirtQueue * vq)49 void virtio_blk_data_plane_notify(VirtIOBlockDataPlane *s, VirtQueue *vq)
50 {
51 if (s->batch_notifications) {
52 set_bit(virtio_get_queue_index(vq), s->batch_notify_vqs);
53 qemu_bh_schedule(s->bh);
54 } else {
55 virtio_notify_irqfd(s->vdev, vq);
56 }
57 }
58
notify_guest_bh(void * opaque)59 static void notify_guest_bh(void *opaque)
60 {
61 VirtIOBlockDataPlane *s = opaque;
62 unsigned nvqs = s->conf->num_queues;
63 unsigned long bitmap[BITS_TO_LONGS(nvqs)];
64 unsigned j;
65
66 memcpy(bitmap, s->batch_notify_vqs, sizeof(bitmap));
67 memset(s->batch_notify_vqs, 0, sizeof(bitmap));
68
69 for (j = 0; j < nvqs; j += BITS_PER_LONG) {
70 unsigned long bits = bitmap[j / BITS_PER_LONG];
71
72 while (bits != 0) {
73 unsigned i = j + ctzl(bits);
74 VirtQueue *vq = virtio_get_queue(s->vdev, i);
75
76 virtio_notify_irqfd(s->vdev, vq);
77
78 bits &= bits - 1; /* clear right-most bit */
79 }
80 }
81 }
82
83 /* Context: QEMU global mutex held */
virtio_blk_data_plane_create(VirtIODevice * vdev,VirtIOBlkConf * conf,VirtIOBlockDataPlane ** dataplane,Error ** errp)84 bool virtio_blk_data_plane_create(VirtIODevice *vdev, VirtIOBlkConf *conf,
85 VirtIOBlockDataPlane **dataplane,
86 Error **errp)
87 {
88 VirtIOBlockDataPlane *s;
89 BusState *qbus = BUS(qdev_get_parent_bus(DEVICE(vdev)));
90 VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
91
92 *dataplane = NULL;
93
94 if (conf->iothread) {
95 if (!k->set_guest_notifiers || !k->ioeventfd_assign) {
96 error_setg(errp,
97 "device is incompatible with iothread "
98 "(transport does not support notifiers)");
99 return false;
100 }
101 if (!virtio_device_ioeventfd_enabled(vdev)) {
102 error_setg(errp, "ioeventfd is required for iothread");
103 return false;
104 }
105
106 /* If dataplane is (re-)enabled while the guest is running there could
107 * be block jobs that can conflict.
108 */
109 if (blk_op_is_blocked(conf->conf.blk, BLOCK_OP_TYPE_DATAPLANE, errp)) {
110 error_prepend(errp, "cannot start virtio-blk dataplane: ");
111 return false;
112 }
113 }
114 /* Don't try if transport does not support notifiers. */
115 if (!virtio_device_ioeventfd_enabled(vdev)) {
116 return false;
117 }
118
119 s = g_new0(VirtIOBlockDataPlane, 1);
120 s->vdev = vdev;
121 s->conf = conf;
122
123 if (conf->iothread) {
124 s->iothread = conf->iothread;
125 object_ref(OBJECT(s->iothread));
126 s->ctx = iothread_get_aio_context(s->iothread);
127 } else {
128 s->ctx = qemu_get_aio_context();
129 }
130 s->bh = aio_bh_new(s->ctx, notify_guest_bh, s);
131 s->batch_notify_vqs = bitmap_new(conf->num_queues);
132
133 *dataplane = s;
134
135 return true;
136 }
137
138 /* Context: QEMU global mutex held */
virtio_blk_data_plane_destroy(VirtIOBlockDataPlane * s)139 void virtio_blk_data_plane_destroy(VirtIOBlockDataPlane *s)
140 {
141 VirtIOBlock *vblk;
142
143 if (!s) {
144 return;
145 }
146
147 vblk = VIRTIO_BLK(s->vdev);
148 assert(!vblk->dataplane_started);
149 g_free(s->batch_notify_vqs);
150 qemu_bh_delete(s->bh);
151 if (s->iothread) {
152 object_unref(OBJECT(s->iothread));
153 }
154 g_free(s);
155 }
156
/*
 * Host notifier handler installed on each virtqueue by
 * virtio_blk_data_plane_start().  Asserts that the dataplane exists and
 * is started, then forwards to virtio_blk_handle_vq() and returns its
 * result.
 */
static bool virtio_blk_data_plane_handle_output(VirtIODevice *vdev,
                                                VirtQueue *vq)
{
    VirtIOBlock *vblk = (VirtIOBlock *)vdev;

    assert(vblk->dataplane);
    assert(vblk->dataplane_started);

    return virtio_blk_handle_vq(vblk, vq);
}
167
168 /* Context: QEMU global mutex held */
virtio_blk_data_plane_start(VirtIODevice * vdev)169 int virtio_blk_data_plane_start(VirtIODevice *vdev)
170 {
171 VirtIOBlock *vblk = VIRTIO_BLK(vdev);
172 VirtIOBlockDataPlane *s = vblk->dataplane;
173 BusState *qbus = BUS(qdev_get_parent_bus(DEVICE(vblk)));
174 VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
175 unsigned i;
176 unsigned nvqs = s->conf->num_queues;
177 Error *local_err = NULL;
178 int r;
179
180 if (vblk->dataplane_started || s->starting) {
181 return 0;
182 }
183
184 s->starting = true;
185
186 if (!virtio_vdev_has_feature(vdev, VIRTIO_RING_F_EVENT_IDX)) {
187 s->batch_notifications = true;
188 } else {
189 s->batch_notifications = false;
190 }
191
192 /* Set up guest notifier (irq) */
193 r = k->set_guest_notifiers(qbus->parent, nvqs, true);
194 if (r != 0) {
195 error_report("virtio-blk failed to set guest notifier (%d), "
196 "ensure -accel kvm is set.", r);
197 goto fail_guest_notifiers;
198 }
199
200 /* Set up virtqueue notify */
201 for (i = 0; i < nvqs; i++) {
202 r = virtio_bus_set_host_notifier(VIRTIO_BUS(qbus), i, true);
203 if (r != 0) {
204 fprintf(stderr, "virtio-blk failed to set host notifier (%d)\n", r);
205 while (i--) {
206 virtio_bus_set_host_notifier(VIRTIO_BUS(qbus), i, false);
207 virtio_bus_cleanup_host_notifier(VIRTIO_BUS(qbus), i);
208 }
209 goto fail_guest_notifiers;
210 }
211 }
212
213 s->starting = false;
214 vblk->dataplane_started = true;
215 trace_virtio_blk_data_plane_start(s);
216
217 r = blk_set_aio_context(s->conf->conf.blk, s->ctx, &local_err);
218 if (r < 0) {
219 error_report_err(local_err);
220 goto fail_guest_notifiers;
221 }
222
223 /* Kick right away to begin processing requests already in vring */
224 for (i = 0; i < nvqs; i++) {
225 VirtQueue *vq = virtio_get_queue(s->vdev, i);
226
227 event_notifier_set(virtio_queue_get_host_notifier(vq));
228 }
229
230 /* Get this show started by hooking up our callbacks */
231 aio_context_acquire(s->ctx);
232 for (i = 0; i < nvqs; i++) {
233 VirtQueue *vq = virtio_get_queue(s->vdev, i);
234
235 virtio_queue_aio_set_host_notifier_handler(vq, s->ctx,
236 virtio_blk_data_plane_handle_output);
237 }
238 aio_context_release(s->ctx);
239 return 0;
240
241 fail_guest_notifiers:
242 vblk->dataplane_disabled = true;
243 s->starting = false;
244 vblk->dataplane_started = true;
245 return -ENOSYS;
246 }
247
248 /* Stop notifications for new requests from guest.
249 *
250 * Context: BH in IOThread
251 */
virtio_blk_data_plane_stop_bh(void * opaque)252 static void virtio_blk_data_plane_stop_bh(void *opaque)
253 {
254 VirtIOBlockDataPlane *s = opaque;
255 unsigned i;
256
257 for (i = 0; i < s->conf->num_queues; i++) {
258 VirtQueue *vq = virtio_get_queue(s->vdev, i);
259
260 virtio_queue_aio_set_host_notifier_handler(vq, s->ctx, NULL);
261 }
262 }
263
264 /* Context: QEMU global mutex held */
virtio_blk_data_plane_stop(VirtIODevice * vdev)265 void virtio_blk_data_plane_stop(VirtIODevice *vdev)
266 {
267 VirtIOBlock *vblk = VIRTIO_BLK(vdev);
268 VirtIOBlockDataPlane *s = vblk->dataplane;
269 BusState *qbus = qdev_get_parent_bus(DEVICE(vblk));
270 VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
271 unsigned i;
272 unsigned nvqs = s->conf->num_queues;
273
274 if (!vblk->dataplane_started || s->stopping) {
275 return;
276 }
277
278 /* Better luck next time. */
279 if (vblk->dataplane_disabled) {
280 vblk->dataplane_disabled = false;
281 vblk->dataplane_started = false;
282 return;
283 }
284 s->stopping = true;
285 trace_virtio_blk_data_plane_stop(s);
286
287 aio_context_acquire(s->ctx);
288 aio_wait_bh_oneshot(s->ctx, virtio_blk_data_plane_stop_bh, s);
289
290 /* Drain and try to switch bs back to the QEMU main loop. If other users
291 * keep the BlockBackend in the iothread, that's ok */
292 blk_set_aio_context(s->conf->conf.blk, qemu_get_aio_context(), NULL);
293
294 aio_context_release(s->ctx);
295
296 for (i = 0; i < nvqs; i++) {
297 virtio_bus_set_host_notifier(VIRTIO_BUS(qbus), i, false);
298 virtio_bus_cleanup_host_notifier(VIRTIO_BUS(qbus), i);
299 }
300
301 qemu_bh_cancel(s->bh);
302 notify_guest_bh(s); /* final chance to notify guest */
303
304 /* Clean up guest notifier (irq) */
305 k->set_guest_notifiers(qbus->parent, nvqs, false);
306
307 vblk->dataplane_started = false;
308 s->stopping = false;
309 }
310