xref: /qemu/block/parallels.c (revision a94750d9)
/*
 * Block driver for Parallels disk image format
 *
 * Copyright (c) 2007 Alex Beregszaszi
 * Copyright (c) 2015 Denis V. Lunev <den@openvz.org>
 *
 * This code was originally based on comparing different disk images created
 * by Parallels. Currently it is based on opened OpenVZ sources
 * available at
 *     http://git.openvz.org/?p=ploop;a=summary
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
30922a01a0SMarkus Armbruster 
3180c71a24SPeter Maydell #include "qemu/osdep.h"
32baefd977SVladimir Sementsov-Ogievskiy #include "qemu/error-report.h"
33da34e65cSMarkus Armbruster #include "qapi/error.h"
34737e150eSPaolo Bonzini #include "block/block_int.h"
35609f45eaSMax Reitz #include "block/qdict.h"
368942764fSKevin Wolf #include "sysemu/block-backend.h"
371de7afc9SPaolo Bonzini #include "qemu/module.h"
38922a01a0SMarkus Armbruster #include "qemu/option.h"
391511b490SKevin Wolf #include "qapi/qmp/qdict.h"
401511b490SKevin Wolf #include "qapi/qobject-input-visitor.h"
411511b490SKevin Wolf #include "qapi/qapi-visit-block-core.h"
4258369e22SPaolo Bonzini #include "qemu/bswap.h"
430d31c7c2SDenis V. Lunev #include "qemu/bitmap.h"
441d0f37cfSJeff Cody #include "migration/blocker.h"
4590fe66f0SKlim Kireev #include "parallels.h"
46019d6b8fSAnthony Liguori 
47019d6b8fSAnthony Liguori /**************************************************************/
48019d6b8fSAnthony Liguori 
/* 16-character magic strings identifying a Parallels image header. */
#define HEADER_MAGIC    "WithoutFreeSpace"
/* This is the magic written into headers of newly created images. */
#define HEADER_MAGIC2   "WithouFreSpacExt"
/* Format version stored (little-endian) in newly created headers. */
#define HEADER_VERSION  2
/* NOTE(review): presumably the "image in use" marker; confirm at use site. */
#define HEADER_INUSE_MAGIC  (0x746F6E59)
/*
 * Upper bound on the ratio image size / cluster size accepted at creation:
 * the virtual size must stay below MAX_PARALLELS_IMAGE_FACTOR * cluster size.
 */
#define MAX_PARALLELS_IMAGE_FACTOR  (1ULL << 32)
54019d6b8fSAnthony Liguori 
55f7abe0ecSMarc-André Lureau static QEnumLookup prealloc_mode_lookup = {
56f7abe0ecSMarc-André Lureau     .array = (const char *const[]) {
57d6179011SDenis V. Lunev         "falloc",
58d6179011SDenis V. Lunev         "truncate",
59f7abe0ecSMarc-André Lureau     },
60f7abe0ecSMarc-André Lureau     .size = PRL_PREALLOC_MODE__MAX
61d6179011SDenis V. Lunev };
62d6179011SDenis V. Lunev 
63d6179011SDenis V. Lunev #define PARALLELS_OPT_PREALLOC_MODE     "prealloc-mode"
64d6179011SDenis V. Lunev #define PARALLELS_OPT_PREALLOC_SIZE     "prealloc-size"
65d6179011SDenis V. Lunev 
66d6179011SDenis V. Lunev static QemuOptsList parallels_runtime_opts = {
67d6179011SDenis V. Lunev     .name = "parallels",
68d6179011SDenis V. Lunev     .head = QTAILQ_HEAD_INITIALIZER(parallels_runtime_opts.head),
69d6179011SDenis V. Lunev     .desc = {
70d6179011SDenis V. Lunev         {
71d6179011SDenis V. Lunev             .name = PARALLELS_OPT_PREALLOC_SIZE,
72d6179011SDenis V. Lunev             .type = QEMU_OPT_SIZE,
73d6179011SDenis V. Lunev             .help = "Preallocation size on image expansion",
74ff5bbe56SEdgar Kaziahmedov             .def_value_str = "128M",
75d6179011SDenis V. Lunev         },
76d6179011SDenis V. Lunev         {
77d6179011SDenis V. Lunev             .name = PARALLELS_OPT_PREALLOC_MODE,
78d6179011SDenis V. Lunev             .type = QEMU_OPT_STRING,
79d6179011SDenis V. Lunev             .help = "Preallocation mode on image expansion "
80d6179011SDenis V. Lunev                     "(allowed values: falloc, truncate)",
81d6179011SDenis V. Lunev             .def_value_str = "falloc",
82d6179011SDenis V. Lunev         },
83d6179011SDenis V. Lunev         { /* end of list */ },
84d6179011SDenis V. Lunev     },
85d6179011SDenis V. Lunev };
86d6179011SDenis V. Lunev 
871511b490SKevin Wolf static QemuOptsList parallels_create_opts = {
881511b490SKevin Wolf     .name = "parallels-create-opts",
891511b490SKevin Wolf     .head = QTAILQ_HEAD_INITIALIZER(parallels_create_opts.head),
901511b490SKevin Wolf     .desc = {
911511b490SKevin Wolf         {
921511b490SKevin Wolf             .name = BLOCK_OPT_SIZE,
931511b490SKevin Wolf             .type = QEMU_OPT_SIZE,
941511b490SKevin Wolf             .help = "Virtual disk size",
951511b490SKevin Wolf         },
961511b490SKevin Wolf         {
971511b490SKevin Wolf             .name = BLOCK_OPT_CLUSTER_SIZE,
981511b490SKevin Wolf             .type = QEMU_OPT_SIZE,
991511b490SKevin Wolf             .help = "Parallels image cluster size",
1001511b490SKevin Wolf             .def_value_str = stringify(DEFAULT_CLUSTER_SIZE),
1011511b490SKevin Wolf         },
1021511b490SKevin Wolf         { /* end of list */ }
1031511b490SKevin Wolf     }
1041511b490SKevin Wolf };
1051511b490SKevin Wolf 
106d6179011SDenis V. Lunev 
107555cc9d9SDenis V. Lunev static int64_t bat2sect(BDRVParallelsState *s, uint32_t idx)
108555cc9d9SDenis V. Lunev {
109dd97cdc0SDenis V. Lunev     return (uint64_t)le32_to_cpu(s->bat_bitmap[idx]) * s->off_multiplier;
110555cc9d9SDenis V. Lunev }
111555cc9d9SDenis V. Lunev 
1122d68e22eSDenis V. Lunev static uint32_t bat_entry_off(uint32_t idx)
1132d68e22eSDenis V. Lunev {
1142d68e22eSDenis V. Lunev     return sizeof(ParallelsHeader) + sizeof(uint32_t) * idx;
1152d68e22eSDenis V. Lunev }
1162d68e22eSDenis V. Lunev 
11729442569SRoman Kagan static int64_t seek_to_sector(BDRVParallelsState *s, int64_t sector_num)
118019d6b8fSAnthony Liguori {
119c34d2451SDavid Woodhouse     uint32_t index, offset;
120019d6b8fSAnthony Liguori 
121019d6b8fSAnthony Liguori     index = sector_num / s->tracks;
122019d6b8fSAnthony Liguori     offset = sector_num % s->tracks;
123019d6b8fSAnthony Liguori 
1249d8b88f6SChristoph Hellwig     /* not allocated */
125369f7de9SDenis V. Lunev     if ((index >= s->bat_size) || (s->bat_bitmap[index] == 0)) {
126019d6b8fSAnthony Liguori         return -1;
127369f7de9SDenis V. Lunev     }
128555cc9d9SDenis V. Lunev     return bat2sect(s, index) + offset;
129019d6b8fSAnthony Liguori }
130019d6b8fSAnthony Liguori 
1319de9da17SRoman Kagan static int cluster_remainder(BDRVParallelsState *s, int64_t sector_num,
1329de9da17SRoman Kagan         int nb_sectors)
1339de9da17SRoman Kagan {
1349de9da17SRoman Kagan     int ret = s->tracks - sector_num % s->tracks;
1359de9da17SRoman Kagan     return MIN(nb_sectors, ret);
1369de9da17SRoman Kagan }
1379de9da17SRoman Kagan 
1386953d920SDenis V. Lunev static int64_t block_status(BDRVParallelsState *s, int64_t sector_num,
1396953d920SDenis V. Lunev                             int nb_sectors, int *pnum)
1406953d920SDenis V. Lunev {
1416953d920SDenis V. Lunev     int64_t start_off = -2, prev_end_off = -2;
1426953d920SDenis V. Lunev 
1436953d920SDenis V. Lunev     *pnum = 0;
1446953d920SDenis V. Lunev     while (nb_sectors > 0 || start_off == -2) {
1456953d920SDenis V. Lunev         int64_t offset = seek_to_sector(s, sector_num);
1466953d920SDenis V. Lunev         int to_end;
1476953d920SDenis V. Lunev 
1486953d920SDenis V. Lunev         if (start_off == -2) {
1496953d920SDenis V. Lunev             start_off = offset;
1506953d920SDenis V. Lunev             prev_end_off = offset;
1516953d920SDenis V. Lunev         } else if (offset != prev_end_off) {
1526953d920SDenis V. Lunev             break;
1536953d920SDenis V. Lunev         }
1546953d920SDenis V. Lunev 
1556953d920SDenis V. Lunev         to_end = cluster_remainder(s, sector_num, nb_sectors);
1566953d920SDenis V. Lunev         nb_sectors -= to_end;
1576953d920SDenis V. Lunev         sector_num += to_end;
1586953d920SDenis V. Lunev         *pnum += to_end;
1596953d920SDenis V. Lunev 
1606953d920SDenis V. Lunev         if (offset > 0) {
1616953d920SDenis V. Lunev             prev_end_off += to_end;
1626953d920SDenis V. Lunev         }
1636953d920SDenis V. Lunev     }
1646953d920SDenis V. Lunev     return start_off;
1656953d920SDenis V. Lunev }
1666953d920SDenis V. Lunev 
167ddd2ef2cSDenis V. Lunev static int64_t allocate_clusters(BlockDriverState *bs, int64_t sector_num,
168ddd2ef2cSDenis V. Lunev                                  int nb_sectors, int *pnum)
1695a41e1faSDenis V. Lunev {
170bda4cdcbSEric Blake     int ret = 0;
1715a41e1faSDenis V. Lunev     BDRVParallelsState *s = bs->opaque;
172d8b83e37SDenis V. Lunev     int64_t pos, space, idx, to_allocate, i, len;
173ddd2ef2cSDenis V. Lunev 
174ddd2ef2cSDenis V. Lunev     pos = block_status(s, sector_num, nb_sectors, pnum);
175ddd2ef2cSDenis V. Lunev     if (pos > 0) {
176ddd2ef2cSDenis V. Lunev         return pos;
177ddd2ef2cSDenis V. Lunev     }
1785a41e1faSDenis V. Lunev 
1795a41e1faSDenis V. Lunev     idx = sector_num / s->tracks;
180969401feSLaurent Vivier     to_allocate = DIV_ROUND_UP(sector_num + *pnum, s->tracks) - idx;
18186d1bd70SMax Reitz 
18286d1bd70SMax Reitz     /* This function is called only by parallels_co_writev(), which will never
18386d1bd70SMax Reitz      * pass a sector_num at or beyond the end of the image (because the block
18486d1bd70SMax Reitz      * layer never passes such a sector_num to that function). Therefore, idx
18586d1bd70SMax Reitz      * is always below s->bat_size.
18686d1bd70SMax Reitz      * block_status() will limit *pnum so that sector_num + *pnum will not
18786d1bd70SMax Reitz      * exceed the image end. Therefore, idx + to_allocate cannot exceed
18886d1bd70SMax Reitz      * s->bat_size.
18986d1bd70SMax Reitz      * Note that s->bat_size is an unsigned int, therefore idx + to_allocate
19086d1bd70SMax Reitz      * will always fit into a uint32_t. */
19186d1bd70SMax Reitz     assert(idx < s->bat_size && idx + to_allocate <= s->bat_size);
19286d1bd70SMax Reitz 
193ddd2ef2cSDenis V. Lunev     space = to_allocate * s->tracks;
194d8b83e37SDenis V. Lunev     len = bdrv_getlength(bs->file->bs);
195d8b83e37SDenis V. Lunev     if (len < 0) {
196d8b83e37SDenis V. Lunev         return len;
197d8b83e37SDenis V. Lunev     }
198d8b83e37SDenis V. Lunev     if (s->data_end + space > (len >> BDRV_SECTOR_BITS)) {
199ddd2ef2cSDenis V. Lunev         space += s->prealloc_size;
200bda4cdcbSEric Blake         /*
201bda4cdcbSEric Blake          * We require the expanded size to read back as zero. If the
202bda4cdcbSEric Blake          * user permitted truncation, we try that; but if it fails, we
203bda4cdcbSEric Blake          * force the safer-but-slower fallocate.
204bda4cdcbSEric Blake          */
205bda4cdcbSEric Blake         if (s->prealloc_mode == PRL_PREALLOC_MODE_TRUNCATE) {
206bda4cdcbSEric Blake             ret = bdrv_truncate(bs->file,
207bda4cdcbSEric Blake                                 (s->data_end + space) << BDRV_SECTOR_BITS,
208bda4cdcbSEric Blake                                 false, PREALLOC_MODE_OFF, BDRV_REQ_ZERO_WRITE,
209bda4cdcbSEric Blake                                 NULL);
210bda4cdcbSEric Blake             if (ret == -ENOTSUP) {
211bda4cdcbSEric Blake                 s->prealloc_mode = PRL_PREALLOC_MODE_FALLOCATE;
212bda4cdcbSEric Blake             }
213bda4cdcbSEric Blake         }
21419f5dc15SDenis V. Lunev         if (s->prealloc_mode == PRL_PREALLOC_MODE_FALLOCATE) {
215720ff280SKevin Wolf             ret = bdrv_pwrite_zeroes(bs->file,
21674021bc4SEric Blake                                      s->data_end << BDRV_SECTOR_BITS,
21774021bc4SEric Blake                                      space << BDRV_SECTOR_BITS, 0);
2185a41e1faSDenis V. Lunev         }
2195a41e1faSDenis V. Lunev         if (ret < 0) {
2205a41e1faSDenis V. Lunev             return ret;
2215a41e1faSDenis V. Lunev         }
22219f5dc15SDenis V. Lunev     }
223ddd2ef2cSDenis V. Lunev 
224bcbb3866SEdgar Kaziakhmedov     /* Try to read from backing to fill empty clusters
225bcbb3866SEdgar Kaziakhmedov      * FIXME: 1. previous write_zeroes may be redundant
226bcbb3866SEdgar Kaziakhmedov      *        2. most of data we read from backing will be rewritten by
227bcbb3866SEdgar Kaziakhmedov      *           parallels_co_writev. On aligned-to-cluster write we do not need
228bcbb3866SEdgar Kaziakhmedov      *           this read at all.
229bcbb3866SEdgar Kaziakhmedov      *        3. it would be good to combine write of data from backing and new
230bcbb3866SEdgar Kaziakhmedov      *           data into one write call */
231bcbb3866SEdgar Kaziakhmedov     if (bs->backing) {
232bcbb3866SEdgar Kaziakhmedov         int64_t nb_cow_sectors = to_allocate * s->tracks;
233bcbb3866SEdgar Kaziakhmedov         int64_t nb_cow_bytes = nb_cow_sectors << BDRV_SECTOR_BITS;
234a4072543SVladimir Sementsov-Ogievskiy         void *buf = qemu_blockalign(bs, nb_cow_bytes);
235bcbb3866SEdgar Kaziakhmedov 
236a4072543SVladimir Sementsov-Ogievskiy         ret = bdrv_co_pread(bs->backing, idx * s->tracks * BDRV_SECTOR_SIZE,
237a4072543SVladimir Sementsov-Ogievskiy                             nb_cow_bytes, buf, 0);
238bcbb3866SEdgar Kaziakhmedov         if (ret < 0) {
239a4072543SVladimir Sementsov-Ogievskiy             qemu_vfree(buf);
240bcbb3866SEdgar Kaziakhmedov             return ret;
241bcbb3866SEdgar Kaziakhmedov         }
242bcbb3866SEdgar Kaziakhmedov 
243d08c2a24SEric Blake         ret = bdrv_co_pwritev(bs->file, s->data_end * BDRV_SECTOR_SIZE,
244a4072543SVladimir Sementsov-Ogievskiy                               nb_cow_bytes, buf, 0);
245a4072543SVladimir Sementsov-Ogievskiy         qemu_vfree(buf);
246bcbb3866SEdgar Kaziakhmedov         if (ret < 0) {
247bcbb3866SEdgar Kaziakhmedov             return ret;
248bcbb3866SEdgar Kaziakhmedov         }
249bcbb3866SEdgar Kaziakhmedov     }
250bcbb3866SEdgar Kaziakhmedov 
251ddd2ef2cSDenis V. Lunev     for (i = 0; i < to_allocate; i++) {
252ddd2ef2cSDenis V. Lunev         s->bat_bitmap[idx + i] = cpu_to_le32(s->data_end / s->off_multiplier);
25319f5dc15SDenis V. Lunev         s->data_end += s->tracks;
254ddd2ef2cSDenis V. Lunev         bitmap_set(s->bat_dirty_bmap,
255c9f6856dSVladimir Sementsov-Ogievskiy                    bat_entry_off(idx + i) / s->bat_dirty_block, 1);
256ddd2ef2cSDenis V. Lunev     }
2575a41e1faSDenis V. Lunev 
258ddd2ef2cSDenis V. Lunev     return bat2sect(s, idx) + sector_num % s->tracks;
2595a41e1faSDenis V. Lunev }
2605a41e1faSDenis V. Lunev 
2610d31c7c2SDenis V. Lunev 
2620d31c7c2SDenis V. Lunev static coroutine_fn int parallels_co_flush_to_os(BlockDriverState *bs)
2630d31c7c2SDenis V. Lunev {
2640d31c7c2SDenis V. Lunev     BDRVParallelsState *s = bs->opaque;
2650d31c7c2SDenis V. Lunev     unsigned long size = DIV_ROUND_UP(s->header_size, s->bat_dirty_block);
2660d31c7c2SDenis V. Lunev     unsigned long bit;
2670d31c7c2SDenis V. Lunev 
2680d31c7c2SDenis V. Lunev     qemu_co_mutex_lock(&s->lock);
2690d31c7c2SDenis V. Lunev 
2700d31c7c2SDenis V. Lunev     bit = find_first_bit(s->bat_dirty_bmap, size);
2710d31c7c2SDenis V. Lunev     while (bit < size) {
2720d31c7c2SDenis V. Lunev         uint32_t off = bit * s->bat_dirty_block;
2730d31c7c2SDenis V. Lunev         uint32_t to_write = s->bat_dirty_block;
2740d31c7c2SDenis V. Lunev         int ret;
2750d31c7c2SDenis V. Lunev 
2760d31c7c2SDenis V. Lunev         if (off + to_write > s->header_size) {
2770d31c7c2SDenis V. Lunev             to_write = s->header_size - off;
2780d31c7c2SDenis V. Lunev         }
279d9ca2ea2SKevin Wolf         ret = bdrv_pwrite(bs->file, off, (uint8_t *)s->header + off,
2809a4f4c31SKevin Wolf                           to_write);
2810d31c7c2SDenis V. Lunev         if (ret < 0) {
2820d31c7c2SDenis V. Lunev             qemu_co_mutex_unlock(&s->lock);
2830d31c7c2SDenis V. Lunev             return ret;
2840d31c7c2SDenis V. Lunev         }
2850d31c7c2SDenis V. Lunev         bit = find_next_bit(s->bat_dirty_bmap, size, bit + 1);
2860d31c7c2SDenis V. Lunev     }
2870d31c7c2SDenis V. Lunev     bitmap_zero(s->bat_dirty_bmap, size);
2880d31c7c2SDenis V. Lunev 
2890d31c7c2SDenis V. Lunev     qemu_co_mutex_unlock(&s->lock);
2900d31c7c2SDenis V. Lunev     return 0;
2910d31c7c2SDenis V. Lunev }
2920d31c7c2SDenis V. Lunev 
2930d31c7c2SDenis V. Lunev 
2948e0cf59dSEric Blake static int coroutine_fn parallels_co_block_status(BlockDriverState *bs,
2958e0cf59dSEric Blake                                                   bool want_zero,
2968e0cf59dSEric Blake                                                   int64_t offset,
2978e0cf59dSEric Blake                                                   int64_t bytes,
2988e0cf59dSEric Blake                                                   int64_t *pnum,
2998e0cf59dSEric Blake                                                   int64_t *map,
3008e0cf59dSEric Blake                                                   BlockDriverState **file)
301dd3bed16SRoman Kagan {
302dd3bed16SRoman Kagan     BDRVParallelsState *s = bs->opaque;
3038e0cf59dSEric Blake     int count;
304dd3bed16SRoman Kagan 
3058e0cf59dSEric Blake     assert(QEMU_IS_ALIGNED(offset | bytes, BDRV_SECTOR_SIZE));
306dd3bed16SRoman Kagan     qemu_co_mutex_lock(&s->lock);
3078e0cf59dSEric Blake     offset = block_status(s, offset >> BDRV_SECTOR_BITS,
3088e0cf59dSEric Blake                           bytes >> BDRV_SECTOR_BITS, &count);
309dd3bed16SRoman Kagan     qemu_co_mutex_unlock(&s->lock);
310dd3bed16SRoman Kagan 
3118e0cf59dSEric Blake     *pnum = count * BDRV_SECTOR_SIZE;
312dd3bed16SRoman Kagan     if (offset < 0) {
313dd3bed16SRoman Kagan         return 0;
314dd3bed16SRoman Kagan     }
315dd3bed16SRoman Kagan 
3168e0cf59dSEric Blake     *map = offset * BDRV_SECTOR_SIZE;
317ddf4987dSFam Zheng     *file = bs->file->bs;
3188e0cf59dSEric Blake     return BDRV_BLOCK_DATA | BDRV_BLOCK_OFFSET_VALID;
319dd3bed16SRoman Kagan }
320dd3bed16SRoman Kagan 
3215a41e1faSDenis V. Lunev static coroutine_fn int parallels_co_writev(BlockDriverState *bs,
322e18a58b4SEric Blake                                             int64_t sector_num, int nb_sectors,
323e18a58b4SEric Blake                                             QEMUIOVector *qiov, int flags)
3245a41e1faSDenis V. Lunev {
3255a41e1faSDenis V. Lunev     BDRVParallelsState *s = bs->opaque;
3265a41e1faSDenis V. Lunev     uint64_t bytes_done = 0;
3275a41e1faSDenis V. Lunev     QEMUIOVector hd_qiov;
3285a41e1faSDenis V. Lunev     int ret = 0;
3295a41e1faSDenis V. Lunev 
330e18a58b4SEric Blake     assert(!flags);
3315a41e1faSDenis V. Lunev     qemu_iovec_init(&hd_qiov, qiov->niov);
3325a41e1faSDenis V. Lunev 
3335a41e1faSDenis V. Lunev     while (nb_sectors > 0) {
3345a41e1faSDenis V. Lunev         int64_t position;
3355a41e1faSDenis V. Lunev         int n, nbytes;
3365a41e1faSDenis V. Lunev 
3375a41e1faSDenis V. Lunev         qemu_co_mutex_lock(&s->lock);
338ddd2ef2cSDenis V. Lunev         position = allocate_clusters(bs, sector_num, nb_sectors, &n);
3395a41e1faSDenis V. Lunev         qemu_co_mutex_unlock(&s->lock);
3405a41e1faSDenis V. Lunev         if (position < 0) {
3415a41e1faSDenis V. Lunev             ret = (int)position;
3425a41e1faSDenis V. Lunev             break;
3435a41e1faSDenis V. Lunev         }
3445a41e1faSDenis V. Lunev 
3455a41e1faSDenis V. Lunev         nbytes = n << BDRV_SECTOR_BITS;
3465a41e1faSDenis V. Lunev 
3475a41e1faSDenis V. Lunev         qemu_iovec_reset(&hd_qiov);
3485a41e1faSDenis V. Lunev         qemu_iovec_concat(&hd_qiov, qiov, bytes_done, nbytes);
3495a41e1faSDenis V. Lunev 
350d08c2a24SEric Blake         ret = bdrv_co_pwritev(bs->file, position * BDRV_SECTOR_SIZE, nbytes,
351d08c2a24SEric Blake                               &hd_qiov, 0);
3525a41e1faSDenis V. Lunev         if (ret < 0) {
3535a41e1faSDenis V. Lunev             break;
3545a41e1faSDenis V. Lunev         }
3555a41e1faSDenis V. Lunev 
3565a41e1faSDenis V. Lunev         nb_sectors -= n;
3575a41e1faSDenis V. Lunev         sector_num += n;
3585a41e1faSDenis V. Lunev         bytes_done += nbytes;
3595a41e1faSDenis V. Lunev     }
3605a41e1faSDenis V. Lunev 
3615a41e1faSDenis V. Lunev     qemu_iovec_destroy(&hd_qiov);
3625a41e1faSDenis V. Lunev     return ret;
3635a41e1faSDenis V. Lunev }
3645a41e1faSDenis V. Lunev 
365481fb9cfSDenis V. Lunev static coroutine_fn int parallels_co_readv(BlockDriverState *bs,
366481fb9cfSDenis V. Lunev         int64_t sector_num, int nb_sectors, QEMUIOVector *qiov)
367019d6b8fSAnthony Liguori {
36829442569SRoman Kagan     BDRVParallelsState *s = bs->opaque;
369481fb9cfSDenis V. Lunev     uint64_t bytes_done = 0;
370481fb9cfSDenis V. Lunev     QEMUIOVector hd_qiov;
371481fb9cfSDenis V. Lunev     int ret = 0;
372481fb9cfSDenis V. Lunev 
373481fb9cfSDenis V. Lunev     qemu_iovec_init(&hd_qiov, qiov->niov);
37429442569SRoman Kagan 
375019d6b8fSAnthony Liguori     while (nb_sectors > 0) {
376481fb9cfSDenis V. Lunev         int64_t position;
377481fb9cfSDenis V. Lunev         int n, nbytes;
378481fb9cfSDenis V. Lunev 
379481fb9cfSDenis V. Lunev         qemu_co_mutex_lock(&s->lock);
3806953d920SDenis V. Lunev         position = block_status(s, sector_num, nb_sectors, &n);
381481fb9cfSDenis V. Lunev         qemu_co_mutex_unlock(&s->lock);
382481fb9cfSDenis V. Lunev 
383481fb9cfSDenis V. Lunev         nbytes = n << BDRV_SECTOR_BITS;
384481fb9cfSDenis V. Lunev 
385481fb9cfSDenis V. Lunev         qemu_iovec_reset(&hd_qiov);
386481fb9cfSDenis V. Lunev         qemu_iovec_concat(&hd_qiov, qiov, bytes_done, nbytes);
387481fb9cfSDenis V. Lunev 
388bcbb3866SEdgar Kaziakhmedov         if (position < 0) {
389bcbb3866SEdgar Kaziakhmedov             if (bs->backing) {
390d08c2a24SEric Blake                 ret = bdrv_co_preadv(bs->backing, sector_num * BDRV_SECTOR_SIZE,
391d08c2a24SEric Blake                                      nbytes, &hd_qiov, 0);
392bcbb3866SEdgar Kaziakhmedov                 if (ret < 0) {
393bcbb3866SEdgar Kaziakhmedov                     break;
394bcbb3866SEdgar Kaziakhmedov                 }
395bcbb3866SEdgar Kaziakhmedov             } else {
396bcbb3866SEdgar Kaziakhmedov                 qemu_iovec_memset(&hd_qiov, 0, 0, nbytes);
397bcbb3866SEdgar Kaziakhmedov             }
398bcbb3866SEdgar Kaziakhmedov         } else {
399d08c2a24SEric Blake             ret = bdrv_co_preadv(bs->file, position * BDRV_SECTOR_SIZE, nbytes,
400d08c2a24SEric Blake                                  &hd_qiov, 0);
401481fb9cfSDenis V. Lunev             if (ret < 0) {
402481fb9cfSDenis V. Lunev                 break;
4039d8b88f6SChristoph Hellwig             }
404019d6b8fSAnthony Liguori         }
405019d6b8fSAnthony Liguori 
406481fb9cfSDenis V. Lunev         nb_sectors -= n;
407481fb9cfSDenis V. Lunev         sector_num += n;
408481fb9cfSDenis V. Lunev         bytes_done += nbytes;
409481fb9cfSDenis V. Lunev     }
410481fb9cfSDenis V. Lunev 
411481fb9cfSDenis V. Lunev     qemu_iovec_destroy(&hd_qiov);
4122914caa0SPaolo Bonzini     return ret;
4132914caa0SPaolo Bonzini }
4142914caa0SPaolo Bonzini 
41549ad6467SDenis V. Lunev 
4162fd61638SPaolo Bonzini static int coroutine_fn parallels_co_check(BlockDriverState *bs,
4172fd61638SPaolo Bonzini                                            BdrvCheckResult *res,
41849ad6467SDenis V. Lunev                                            BdrvCheckMode fix)
41949ad6467SDenis V. Lunev {
42049ad6467SDenis V. Lunev     BDRVParallelsState *s = bs->opaque;
42149ad6467SDenis V. Lunev     int64_t size, prev_off, high_off;
42249ad6467SDenis V. Lunev     int ret;
42349ad6467SDenis V. Lunev     uint32_t i;
42449ad6467SDenis V. Lunev     bool flush_bat = false;
42549ad6467SDenis V. Lunev 
4269a4f4c31SKevin Wolf     size = bdrv_getlength(bs->file->bs);
42749ad6467SDenis V. Lunev     if (size < 0) {
42849ad6467SDenis V. Lunev         res->check_errors++;
42949ad6467SDenis V. Lunev         return size;
43049ad6467SDenis V. Lunev     }
43149ad6467SDenis V. Lunev 
4322fd61638SPaolo Bonzini     qemu_co_mutex_lock(&s->lock);
4336dd6b9f1SDenis V. Lunev     if (s->header_unclean) {
4346dd6b9f1SDenis V. Lunev         fprintf(stderr, "%s image was not closed correctly\n",
4356dd6b9f1SDenis V. Lunev                 fix & BDRV_FIX_ERRORS ? "Repairing" : "ERROR");
4366dd6b9f1SDenis V. Lunev         res->corruptions++;
4376dd6b9f1SDenis V. Lunev         if (fix & BDRV_FIX_ERRORS) {
4386dd6b9f1SDenis V. Lunev             /* parallels_close will do the job right */
4396dd6b9f1SDenis V. Lunev             res->corruptions_fixed++;
4406dd6b9f1SDenis V. Lunev             s->header_unclean = false;
4416dd6b9f1SDenis V. Lunev         }
4426dd6b9f1SDenis V. Lunev     }
4436dd6b9f1SDenis V. Lunev 
44449ad6467SDenis V. Lunev     res->bfi.total_clusters = s->bat_size;
44549ad6467SDenis V. Lunev     res->bfi.compressed_clusters = 0; /* compression is not supported */
44649ad6467SDenis V. Lunev 
44749ad6467SDenis V. Lunev     high_off = 0;
44849ad6467SDenis V. Lunev     prev_off = 0;
44949ad6467SDenis V. Lunev     for (i = 0; i < s->bat_size; i++) {
45049ad6467SDenis V. Lunev         int64_t off = bat2sect(s, i) << BDRV_SECTOR_BITS;
45149ad6467SDenis V. Lunev         if (off == 0) {
45249ad6467SDenis V. Lunev             prev_off = 0;
45349ad6467SDenis V. Lunev             continue;
45449ad6467SDenis V. Lunev         }
45549ad6467SDenis V. Lunev 
45649ad6467SDenis V. Lunev         /* cluster outside the image */
45749ad6467SDenis V. Lunev         if (off > size) {
45849ad6467SDenis V. Lunev             fprintf(stderr, "%s cluster %u is outside image\n",
45949ad6467SDenis V. Lunev                     fix & BDRV_FIX_ERRORS ? "Repairing" : "ERROR", i);
46049ad6467SDenis V. Lunev             res->corruptions++;
46149ad6467SDenis V. Lunev             if (fix & BDRV_FIX_ERRORS) {
46249ad6467SDenis V. Lunev                 prev_off = 0;
46349ad6467SDenis V. Lunev                 s->bat_bitmap[i] = 0;
46449ad6467SDenis V. Lunev                 res->corruptions_fixed++;
46549ad6467SDenis V. Lunev                 flush_bat = true;
46649ad6467SDenis V. Lunev                 continue;
46749ad6467SDenis V. Lunev             }
46849ad6467SDenis V. Lunev         }
46949ad6467SDenis V. Lunev 
47049ad6467SDenis V. Lunev         res->bfi.allocated_clusters++;
47149ad6467SDenis V. Lunev         if (off > high_off) {
47249ad6467SDenis V. Lunev             high_off = off;
47349ad6467SDenis V. Lunev         }
47449ad6467SDenis V. Lunev 
475e0b5207fSVladimir Sementsov-Ogievskiy         if (prev_off != 0 && (prev_off + s->cluster_size) != off) {
47649ad6467SDenis V. Lunev             res->bfi.fragmented_clusters++;
47749ad6467SDenis V. Lunev         }
47849ad6467SDenis V. Lunev         prev_off = off;
47949ad6467SDenis V. Lunev     }
48049ad6467SDenis V. Lunev 
4812fd61638SPaolo Bonzini     ret = 0;
48249ad6467SDenis V. Lunev     if (flush_bat) {
483d9ca2ea2SKevin Wolf         ret = bdrv_pwrite_sync(bs->file, 0, s->header, s->header_size);
48449ad6467SDenis V. Lunev         if (ret < 0) {
48549ad6467SDenis V. Lunev             res->check_errors++;
4862fd61638SPaolo Bonzini             goto out;
48749ad6467SDenis V. Lunev         }
48849ad6467SDenis V. Lunev     }
48949ad6467SDenis V. Lunev 
490e0b5207fSVladimir Sementsov-Ogievskiy     res->image_end_offset = high_off + s->cluster_size;
49149ad6467SDenis V. Lunev     if (size > res->image_end_offset) {
49249ad6467SDenis V. Lunev         int64_t count;
493e0b5207fSVladimir Sementsov-Ogievskiy         count = DIV_ROUND_UP(size - res->image_end_offset, s->cluster_size);
49449ad6467SDenis V. Lunev         fprintf(stderr, "%s space leaked at the end of the image %" PRId64 "\n",
49549ad6467SDenis V. Lunev                 fix & BDRV_FIX_LEAKS ? "Repairing" : "ERROR",
49649ad6467SDenis V. Lunev                 size - res->image_end_offset);
49749ad6467SDenis V. Lunev         res->leaks += count;
49849ad6467SDenis V. Lunev         if (fix & BDRV_FIX_LEAKS) {
499ed3d2ec9SMax Reitz             Error *local_err = NULL;
500e8d04f92SMax Reitz 
501e8d04f92SMax Reitz             /*
502e8d04f92SMax Reitz              * In order to really repair the image, we must shrink it.
503e8d04f92SMax Reitz              * That means we have to pass exact=true.
504e8d04f92SMax Reitz              */
505e8d04f92SMax Reitz             ret = bdrv_truncate(bs->file, res->image_end_offset, true,
5067b8e4857SKevin Wolf                                 PREALLOC_MODE_OFF, 0, &local_err);
50749ad6467SDenis V. Lunev             if (ret < 0) {
508ed3d2ec9SMax Reitz                 error_report_err(local_err);
50949ad6467SDenis V. Lunev                 res->check_errors++;
5102fd61638SPaolo Bonzini                 goto out;
51149ad6467SDenis V. Lunev             }
51249ad6467SDenis V. Lunev             res->leaks_fixed += count;
51349ad6467SDenis V. Lunev         }
51449ad6467SDenis V. Lunev     }
51549ad6467SDenis V. Lunev 
5162fd61638SPaolo Bonzini out:
5172fd61638SPaolo Bonzini     qemu_co_mutex_unlock(&s->lock);
5182fd61638SPaolo Bonzini     return ret;
51949ad6467SDenis V. Lunev }
52049ad6467SDenis V. Lunev 
52149ad6467SDenis V. Lunev 
5221511b490SKevin Wolf static int coroutine_fn parallels_co_create(BlockdevCreateOptions* opts,
523efc75e2aSStefan Hajnoczi                                             Error **errp)
52474cf6c50SDenis V. Lunev {
5251511b490SKevin Wolf     BlockdevCreateOptionsParallels *parallels_opts;
5261511b490SKevin Wolf     BlockDriverState *bs;
5271511b490SKevin Wolf     BlockBackend *blk;
52874cf6c50SDenis V. Lunev     int64_t total_size, cl_size;
529369f7de9SDenis V. Lunev     uint32_t bat_entries, bat_sectors;
53074cf6c50SDenis V. Lunev     ParallelsHeader header;
5311511b490SKevin Wolf     uint8_t tmp[BDRV_SECTOR_SIZE];
53274cf6c50SDenis V. Lunev     int ret;
53374cf6c50SDenis V. Lunev 
5341511b490SKevin Wolf     assert(opts->driver == BLOCKDEV_DRIVER_PARALLELS);
5351511b490SKevin Wolf     parallels_opts = &opts->u.parallels;
5361511b490SKevin Wolf 
5371511b490SKevin Wolf     /* Sanity checks */
5381511b490SKevin Wolf     total_size = parallels_opts->size;
5391511b490SKevin Wolf 
5401511b490SKevin Wolf     if (parallels_opts->has_cluster_size) {
5411511b490SKevin Wolf         cl_size = parallels_opts->cluster_size;
5421511b490SKevin Wolf     } else {
5431511b490SKevin Wolf         cl_size = DEFAULT_CLUSTER_SIZE;
5441511b490SKevin Wolf     }
5451511b490SKevin Wolf 
5462332d825SKevin Wolf     /* XXX What is the real limit here? This is an insanely large maximum. */
5472332d825SKevin Wolf     if (cl_size >= INT64_MAX / MAX_PARALLELS_IMAGE_FACTOR) {
5482332d825SKevin Wolf         error_setg(errp, "Cluster size is too large");
5492332d825SKevin Wolf         return -EINVAL;
5502332d825SKevin Wolf     }
551555a608cSKlim Kireev     if (total_size >= MAX_PARALLELS_IMAGE_FACTOR * cl_size) {
5521511b490SKevin Wolf         error_setg(errp, "Image size is too large for this cluster size");
553555a608cSKlim Kireev         return -E2BIG;
554555a608cSKlim Kireev     }
55574cf6c50SDenis V. Lunev 
5561511b490SKevin Wolf     if (!QEMU_IS_ALIGNED(total_size, BDRV_SECTOR_SIZE)) {
5571511b490SKevin Wolf         error_setg(errp, "Image size must be a multiple of 512 bytes");
5581511b490SKevin Wolf         return -EINVAL;
55974cf6c50SDenis V. Lunev     }
56074cf6c50SDenis V. Lunev 
5611511b490SKevin Wolf     if (!QEMU_IS_ALIGNED(cl_size, BDRV_SECTOR_SIZE)) {
5621511b490SKevin Wolf         error_setg(errp, "Cluster size must be a multiple of 512 bytes");
5631511b490SKevin Wolf         return -EINVAL;
5641511b490SKevin Wolf     }
5651511b490SKevin Wolf 
5661511b490SKevin Wolf     /* Create BlockBackend to write to the image */
5671511b490SKevin Wolf     bs = bdrv_open_blockdev_ref(parallels_opts->file, errp);
5681511b490SKevin Wolf     if (bs == NULL) {
5698942764fSKevin Wolf         return -EIO;
57074cf6c50SDenis V. Lunev     }
5718942764fSKevin Wolf 
572a3aeeab5SEric Blake     blk = blk_new_with_bs(bs, BLK_PERM_WRITE | BLK_PERM_RESIZE, BLK_PERM_ALL,
573a3aeeab5SEric Blake                           errp);
574a3aeeab5SEric Blake     if (!blk) {
575a3aeeab5SEric Blake         ret = -EPERM;
5761511b490SKevin Wolf         goto out;
5771511b490SKevin Wolf     }
5781511b490SKevin Wolf     blk_set_allow_write_beyond_eof(blk, true);
5791511b490SKevin Wolf 
5801511b490SKevin Wolf     /* Create image format */
581369f7de9SDenis V. Lunev     bat_entries = DIV_ROUND_UP(total_size, cl_size);
5822d68e22eSDenis V. Lunev     bat_sectors = DIV_ROUND_UP(bat_entry_off(bat_entries), cl_size);
583369f7de9SDenis V. Lunev     bat_sectors = (bat_sectors *  cl_size) >> BDRV_SECTOR_BITS;
58474cf6c50SDenis V. Lunev 
58574cf6c50SDenis V. Lunev     memset(&header, 0, sizeof(header));
58674cf6c50SDenis V. Lunev     memcpy(header.magic, HEADER_MAGIC2, sizeof(header.magic));
58774cf6c50SDenis V. Lunev     header.version = cpu_to_le32(HEADER_VERSION);
58874cf6c50SDenis V. Lunev     /* don't care much about geometry, it is not used on image level */
589908b1c84SKlim Kireev     header.heads = cpu_to_le32(HEADS_NUMBER);
590908b1c84SKlim Kireev     header.cylinders = cpu_to_le32(total_size / BDRV_SECTOR_SIZE
591908b1c84SKlim Kireev                                    / HEADS_NUMBER / SEC_IN_CYL);
59274cf6c50SDenis V. Lunev     header.tracks = cpu_to_le32(cl_size >> BDRV_SECTOR_BITS);
593369f7de9SDenis V. Lunev     header.bat_entries = cpu_to_le32(bat_entries);
59474cf6c50SDenis V. Lunev     header.nb_sectors = cpu_to_le64(DIV_ROUND_UP(total_size, BDRV_SECTOR_SIZE));
595369f7de9SDenis V. Lunev     header.data_off = cpu_to_le32(bat_sectors);
59674cf6c50SDenis V. Lunev 
59774cf6c50SDenis V. Lunev     /* write all the data */
59874cf6c50SDenis V. Lunev     memset(tmp, 0, sizeof(tmp));
59974cf6c50SDenis V. Lunev     memcpy(tmp, &header, sizeof(header));
60074cf6c50SDenis V. Lunev 
6011511b490SKevin Wolf     ret = blk_pwrite(blk, 0, tmp, BDRV_SECTOR_SIZE, 0);
60274cf6c50SDenis V. Lunev     if (ret < 0) {
60374cf6c50SDenis V. Lunev         goto exit;
60474cf6c50SDenis V. Lunev     }
6051511b490SKevin Wolf     ret = blk_pwrite_zeroes(blk, BDRV_SECTOR_SIZE,
606983a1600SEric Blake                             (bat_sectors - 1) << BDRV_SECTOR_BITS, 0);
60774cf6c50SDenis V. Lunev     if (ret < 0) {
60874cf6c50SDenis V. Lunev         goto exit;
60974cf6c50SDenis V. Lunev     }
61074cf6c50SDenis V. Lunev 
6111511b490SKevin Wolf     ret = 0;
6121511b490SKevin Wolf out:
6131511b490SKevin Wolf     blk_unref(blk);
6141511b490SKevin Wolf     bdrv_unref(bs);
61574cf6c50SDenis V. Lunev     return ret;
61674cf6c50SDenis V. Lunev 
61774cf6c50SDenis V. Lunev exit:
61874cf6c50SDenis V. Lunev     error_setg_errno(errp, -ret, "Failed to create Parallels image");
6191511b490SKevin Wolf     goto out;
6201511b490SKevin Wolf }
6211511b490SKevin Wolf 
622b92902dfSMaxim Levitsky static int coroutine_fn parallels_co_create_opts(BlockDriver *drv,
623b92902dfSMaxim Levitsky                                                  const char *filename,
6241511b490SKevin Wolf                                                  QemuOpts *opts,
6251511b490SKevin Wolf                                                  Error **errp)
6261511b490SKevin Wolf {
6271511b490SKevin Wolf     BlockdevCreateOptions *create_options = NULL;
6281511b490SKevin Wolf     BlockDriverState *bs = NULL;
62992adf9dbSMarkus Armbruster     QDict *qdict;
6301511b490SKevin Wolf     Visitor *v;
6311511b490SKevin Wolf     int ret;
6321511b490SKevin Wolf 
6331511b490SKevin Wolf     static const QDictRenames opt_renames[] = {
6341511b490SKevin Wolf         { BLOCK_OPT_CLUSTER_SIZE,       "cluster-size" },
6351511b490SKevin Wolf         { NULL, NULL },
6361511b490SKevin Wolf     };
6371511b490SKevin Wolf 
6381511b490SKevin Wolf     /* Parse options and convert legacy syntax */
6391511b490SKevin Wolf     qdict = qemu_opts_to_qdict_filtered(opts, NULL, &parallels_create_opts,
6401511b490SKevin Wolf                                         true);
6411511b490SKevin Wolf 
6421511b490SKevin Wolf     if (!qdict_rename_keys(qdict, opt_renames, errp)) {
6431511b490SKevin Wolf         ret = -EINVAL;
64474cf6c50SDenis V. Lunev         goto done;
64574cf6c50SDenis V. Lunev     }
64674cf6c50SDenis V. Lunev 
6471511b490SKevin Wolf     /* Create and open the file (protocol layer) */
648668f62ecSMarkus Armbruster     ret = bdrv_create_file(filename, opts, errp);
6491511b490SKevin Wolf     if (ret < 0) {
6501511b490SKevin Wolf         goto done;
6511511b490SKevin Wolf     }
6521511b490SKevin Wolf 
6531511b490SKevin Wolf     bs = bdrv_open(filename, NULL, NULL,
6541511b490SKevin Wolf                    BDRV_O_RDWR | BDRV_O_RESIZE | BDRV_O_PROTOCOL, errp);
6551511b490SKevin Wolf     if (bs == NULL) {
6561511b490SKevin Wolf         ret = -EIO;
6571511b490SKevin Wolf         goto done;
6581511b490SKevin Wolf     }
6591511b490SKevin Wolf 
6601511b490SKevin Wolf     /* Now get the QAPI type BlockdevCreateOptions */
6611511b490SKevin Wolf     qdict_put_str(qdict, "driver", "parallels");
6621511b490SKevin Wolf     qdict_put_str(qdict, "file", bs->node_name);
6631511b490SKevin Wolf 
664af91062eSMarkus Armbruster     v = qobject_input_visitor_new_flat_confused(qdict, errp);
665af91062eSMarkus Armbruster     if (!v) {
6661511b490SKevin Wolf         ret = -EINVAL;
6671511b490SKevin Wolf         goto done;
6681511b490SKevin Wolf     }
6691511b490SKevin Wolf 
670b11a093cSMarkus Armbruster     visit_type_BlockdevCreateOptions(v, NULL, &create_options, errp);
6711511b490SKevin Wolf     visit_free(v);
672b11a093cSMarkus Armbruster     if (!create_options) {
6731511b490SKevin Wolf         ret = -EINVAL;
6741511b490SKevin Wolf         goto done;
6751511b490SKevin Wolf     }
6761511b490SKevin Wolf 
6771511b490SKevin Wolf     /* Silently round up sizes */
6781511b490SKevin Wolf     create_options->u.parallels.size =
6791511b490SKevin Wolf         ROUND_UP(create_options->u.parallels.size, BDRV_SECTOR_SIZE);
6801511b490SKevin Wolf     create_options->u.parallels.cluster_size =
6811511b490SKevin Wolf         ROUND_UP(create_options->u.parallels.cluster_size, BDRV_SECTOR_SIZE);
6821511b490SKevin Wolf 
6831511b490SKevin Wolf     /* Create the Parallels image (format layer) */
6841511b490SKevin Wolf     ret = parallels_co_create(create_options, errp);
6851511b490SKevin Wolf     if (ret < 0) {
6861511b490SKevin Wolf         goto done;
6871511b490SKevin Wolf     }
6881511b490SKevin Wolf     ret = 0;
6891511b490SKevin Wolf 
6901511b490SKevin Wolf done:
691cb3e7f08SMarc-André Lureau     qobject_unref(qdict);
6921511b490SKevin Wolf     bdrv_unref(bs);
6931511b490SKevin Wolf     qapi_free_BlockdevCreateOptions(create_options);
6941511b490SKevin Wolf     return ret;
6951511b490SKevin Wolf }
6961511b490SKevin Wolf 
69723d6bd3bSDenis V. Lunev 
69823d6bd3bSDenis V. Lunev static int parallels_probe(const uint8_t *buf, int buf_size,
69923d6bd3bSDenis V. Lunev                            const char *filename)
70023d6bd3bSDenis V. Lunev {
70123d6bd3bSDenis V. Lunev     const ParallelsHeader *ph = (const void *)buf;
70223d6bd3bSDenis V. Lunev 
70323d6bd3bSDenis V. Lunev     if (buf_size < sizeof(ParallelsHeader)) {
70423d6bd3bSDenis V. Lunev         return 0;
70523d6bd3bSDenis V. Lunev     }
70623d6bd3bSDenis V. Lunev 
70723d6bd3bSDenis V. Lunev     if ((!memcmp(ph->magic, HEADER_MAGIC, 16) ||
70823d6bd3bSDenis V. Lunev            !memcmp(ph->magic, HEADER_MAGIC2, 16)) &&
70923d6bd3bSDenis V. Lunev            (le32_to_cpu(ph->version) == HEADER_VERSION)) {
71023d6bd3bSDenis V. Lunev         return 100;
71123d6bd3bSDenis V. Lunev     }
71223d6bd3bSDenis V. Lunev 
71323d6bd3bSDenis V. Lunev     return 0;
71423d6bd3bSDenis V. Lunev }
71523d6bd3bSDenis V. Lunev 
7166dd6b9f1SDenis V. Lunev static int parallels_update_header(BlockDriverState *bs)
7176dd6b9f1SDenis V. Lunev {
7186dd6b9f1SDenis V. Lunev     BDRVParallelsState *s = bs->opaque;
7199a4f4c31SKevin Wolf     unsigned size = MAX(bdrv_opt_mem_align(bs->file->bs),
7209a4f4c31SKevin Wolf                         sizeof(ParallelsHeader));
7216dd6b9f1SDenis V. Lunev 
7226dd6b9f1SDenis V. Lunev     if (size > s->header_size) {
7236dd6b9f1SDenis V. Lunev         size = s->header_size;
7246dd6b9f1SDenis V. Lunev     }
725d9ca2ea2SKevin Wolf     return bdrv_pwrite_sync(bs->file, 0, s->header, size);
7266dd6b9f1SDenis V. Lunev }
7276dd6b9f1SDenis V. Lunev 
72823d6bd3bSDenis V. Lunev static int parallels_open(BlockDriverState *bs, QDict *options, int flags,
72923d6bd3bSDenis V. Lunev                           Error **errp)
73023d6bd3bSDenis V. Lunev {
73123d6bd3bSDenis V. Lunev     BDRVParallelsState *s = bs->opaque;
73223d6bd3bSDenis V. Lunev     ParallelsHeader ph;
73319f5dc15SDenis V. Lunev     int ret, size, i;
734d6179011SDenis V. Lunev     QemuOpts *opts = NULL;
735d6179011SDenis V. Lunev     Error *local_err = NULL;
736d6179011SDenis V. Lunev     char *buf;
73723d6bd3bSDenis V. Lunev 
7388b1869daSMax Reitz     bs->file = bdrv_open_child(NULL, options, "file", bs, &child_of_bds,
7398b1869daSMax Reitz                                BDRV_CHILD_IMAGE, false, errp);
7404e4bf5c4SKevin Wolf     if (!bs->file) {
7414e4bf5c4SKevin Wolf         return -EINVAL;
7424e4bf5c4SKevin Wolf     }
7434e4bf5c4SKevin Wolf 
744cf2ab8fcSKevin Wolf     ret = bdrv_pread(bs->file, 0, &ph, sizeof(ph));
74523d6bd3bSDenis V. Lunev     if (ret < 0) {
74623d6bd3bSDenis V. Lunev         goto fail;
74723d6bd3bSDenis V. Lunev     }
74823d6bd3bSDenis V. Lunev 
74923d6bd3bSDenis V. Lunev     bs->total_sectors = le64_to_cpu(ph.nb_sectors);
75023d6bd3bSDenis V. Lunev 
75123d6bd3bSDenis V. Lunev     if (le32_to_cpu(ph.version) != HEADER_VERSION) {
75223d6bd3bSDenis V. Lunev         goto fail_format;
75323d6bd3bSDenis V. Lunev     }
75423d6bd3bSDenis V. Lunev     if (!memcmp(ph.magic, HEADER_MAGIC, 16)) {
75523d6bd3bSDenis V. Lunev         s->off_multiplier = 1;
75623d6bd3bSDenis V. Lunev         bs->total_sectors = 0xffffffff & bs->total_sectors;
75723d6bd3bSDenis V. Lunev     } else if (!memcmp(ph.magic, HEADER_MAGIC2, 16)) {
75823d6bd3bSDenis V. Lunev         s->off_multiplier = le32_to_cpu(ph.tracks);
75923d6bd3bSDenis V. Lunev     } else {
76023d6bd3bSDenis V. Lunev         goto fail_format;
76123d6bd3bSDenis V. Lunev     }
76223d6bd3bSDenis V. Lunev 
76323d6bd3bSDenis V. Lunev     s->tracks = le32_to_cpu(ph.tracks);
76423d6bd3bSDenis V. Lunev     if (s->tracks == 0) {
76523d6bd3bSDenis V. Lunev         error_setg(errp, "Invalid image: Zero sectors per track");
76623d6bd3bSDenis V. Lunev         ret = -EINVAL;
76723d6bd3bSDenis V. Lunev         goto fail;
76823d6bd3bSDenis V. Lunev     }
76923d6bd3bSDenis V. Lunev     if (s->tracks > INT32_MAX/513) {
77023d6bd3bSDenis V. Lunev         error_setg(errp, "Invalid image: Too big cluster");
77123d6bd3bSDenis V. Lunev         ret = -EFBIG;
77223d6bd3bSDenis V. Lunev         goto fail;
77323d6bd3bSDenis V. Lunev     }
774e0b5207fSVladimir Sementsov-Ogievskiy     s->cluster_size = s->tracks << BDRV_SECTOR_BITS;
77523d6bd3bSDenis V. Lunev 
77623d6bd3bSDenis V. Lunev     s->bat_size = le32_to_cpu(ph.bat_entries);
77723d6bd3bSDenis V. Lunev     if (s->bat_size > INT_MAX / sizeof(uint32_t)) {
77823d6bd3bSDenis V. Lunev         error_setg(errp, "Catalog too large");
77923d6bd3bSDenis V. Lunev         ret = -EFBIG;
78023d6bd3bSDenis V. Lunev         goto fail;
78123d6bd3bSDenis V. Lunev     }
78223d6bd3bSDenis V. Lunev 
7832d68e22eSDenis V. Lunev     size = bat_entry_off(s->bat_size);
7849a4f4c31SKevin Wolf     s->header_size = ROUND_UP(size, bdrv_opt_mem_align(bs->file->bs));
7859a4f4c31SKevin Wolf     s->header = qemu_try_blockalign(bs->file->bs, s->header_size);
78623d6bd3bSDenis V. Lunev     if (s->header == NULL) {
78723d6bd3bSDenis V. Lunev         ret = -ENOMEM;
78823d6bd3bSDenis V. Lunev         goto fail;
78923d6bd3bSDenis V. Lunev     }
79019f5dc15SDenis V. Lunev     s->data_end = le32_to_cpu(ph.data_off);
79119f5dc15SDenis V. Lunev     if (s->data_end == 0) {
79219f5dc15SDenis V. Lunev         s->data_end = ROUND_UP(bat_entry_off(s->bat_size), BDRV_SECTOR_SIZE);
79319f5dc15SDenis V. Lunev     }
79419f5dc15SDenis V. Lunev     if (s->data_end < s->header_size) {
79523d6bd3bSDenis V. Lunev         /* there is not enough unused space to fit to block align between BAT
79623d6bd3bSDenis V. Lunev            and actual data. We can't avoid read-modify-write... */
79723d6bd3bSDenis V. Lunev         s->header_size = size;
79823d6bd3bSDenis V. Lunev     }
79923d6bd3bSDenis V. Lunev 
800cf2ab8fcSKevin Wolf     ret = bdrv_pread(bs->file, 0, s->header, s->header_size);
80123d6bd3bSDenis V. Lunev     if (ret < 0) {
80223d6bd3bSDenis V. Lunev         goto fail;
80323d6bd3bSDenis V. Lunev     }
80423d6bd3bSDenis V. Lunev     s->bat_bitmap = (uint32_t *)(s->header + 1);
80523d6bd3bSDenis V. Lunev 
80619f5dc15SDenis V. Lunev     for (i = 0; i < s->bat_size; i++) {
80719f5dc15SDenis V. Lunev         int64_t off = bat2sect(s, i);
80819f5dc15SDenis V. Lunev         if (off >= s->data_end) {
80919f5dc15SDenis V. Lunev             s->data_end = off + s->tracks;
81019f5dc15SDenis V. Lunev         }
81119f5dc15SDenis V. Lunev     }
81219f5dc15SDenis V. Lunev 
8136dd6b9f1SDenis V. Lunev     if (le32_to_cpu(ph.inuse) == HEADER_INUSE_MAGIC) {
8146dd6b9f1SDenis V. Lunev         /* Image was not closed correctly. The check is mandatory */
8156dd6b9f1SDenis V. Lunev         s->header_unclean = true;
8166dd6b9f1SDenis V. Lunev         if ((flags & BDRV_O_RDWR) && !(flags & BDRV_O_CHECK)) {
8176dd6b9f1SDenis V. Lunev             error_setg(errp, "parallels: Image was not closed correctly; "
8186dd6b9f1SDenis V. Lunev                        "cannot be opened read/write");
8196dd6b9f1SDenis V. Lunev             ret = -EACCES;
8206dd6b9f1SDenis V. Lunev             goto fail;
8216dd6b9f1SDenis V. Lunev         }
8226dd6b9f1SDenis V. Lunev     }
8236dd6b9f1SDenis V. Lunev 
824c6ecec43SMarkus Armbruster     opts = qemu_opts_create(&parallels_runtime_opts, NULL, 0, errp);
825c6ecec43SMarkus Armbruster     if (!opts) {
826d6179011SDenis V. Lunev         goto fail_options;
827d6179011SDenis V. Lunev     }
828d6179011SDenis V. Lunev 
829a5f9b9dfSMarkus Armbruster     if (!qemu_opts_absorb_qdict(opts, options, errp)) {
830d6179011SDenis V. Lunev         goto fail_options;
831d6179011SDenis V. Lunev     }
832d6179011SDenis V. Lunev 
833d6179011SDenis V. Lunev     s->prealloc_size =
834d6179011SDenis V. Lunev         qemu_opt_get_size_del(opts, PARALLELS_OPT_PREALLOC_SIZE, 0);
835d6179011SDenis V. Lunev     s->prealloc_size = MAX(s->tracks, s->prealloc_size >> BDRV_SECTOR_BITS);
836d6179011SDenis V. Lunev     buf = qemu_opt_get_del(opts, PARALLELS_OPT_PREALLOC_MODE);
837bda4cdcbSEric Blake     /* prealloc_mode can be downgraded later during allocate_clusters */
838f7abe0ecSMarc-André Lureau     s->prealloc_mode = qapi_enum_parse(&prealloc_mode_lookup, buf,
83906c60b6cSMarkus Armbruster                                        PRL_PREALLOC_MODE_FALLOCATE,
84006c60b6cSMarkus Armbruster                                        &local_err);
841d6179011SDenis V. Lunev     g_free(buf);
842d6179011SDenis V. Lunev     if (local_err != NULL) {
8434bc6d7eeSMarkus Armbruster         error_propagate(errp, local_err);
844d6179011SDenis V. Lunev         goto fail_options;
845d6179011SDenis V. Lunev     }
846dc62da88SDenis V. Lunev 
847baefd977SVladimir Sementsov-Ogievskiy     if (ph.ext_off) {
848baefd977SVladimir Sementsov-Ogievskiy         if (flags & BDRV_O_RDWR) {
849baefd977SVladimir Sementsov-Ogievskiy             /*
850baefd977SVladimir Sementsov-Ogievskiy              * It's unsafe to open image RW if there is an extension (as we
851baefd977SVladimir Sementsov-Ogievskiy              * don't support it). But parallels driver in QEMU historically
852baefd977SVladimir Sementsov-Ogievskiy              * ignores the extension, so print warning and don't care.
853baefd977SVladimir Sementsov-Ogievskiy              */
854baefd977SVladimir Sementsov-Ogievskiy             warn_report("Format Extension ignored in RW mode");
855baefd977SVladimir Sementsov-Ogievskiy         } else {
856baefd977SVladimir Sementsov-Ogievskiy             ret = parallels_read_format_extension(
857baefd977SVladimir Sementsov-Ogievskiy                     bs, le64_to_cpu(ph.ext_off) << BDRV_SECTOR_BITS, errp);
858baefd977SVladimir Sementsov-Ogievskiy             if (ret < 0) {
859baefd977SVladimir Sementsov-Ogievskiy                 goto fail;
860baefd977SVladimir Sementsov-Ogievskiy             }
861baefd977SVladimir Sementsov-Ogievskiy         }
862baefd977SVladimir Sementsov-Ogievskiy     }
863baefd977SVladimir Sementsov-Ogievskiy 
8646c7d390bSJeff Cody     if ((flags & BDRV_O_RDWR) && !(flags & BDRV_O_INACTIVE)) {
8656dd6b9f1SDenis V. Lunev         s->header->inuse = cpu_to_le32(HEADER_INUSE_MAGIC);
8666dd6b9f1SDenis V. Lunev         ret = parallels_update_header(bs);
8676dd6b9f1SDenis V. Lunev         if (ret < 0) {
8686dd6b9f1SDenis V. Lunev             goto fail;
8696dd6b9f1SDenis V. Lunev         }
8706dd6b9f1SDenis V. Lunev     }
8716dd6b9f1SDenis V. Lunev 
872038adc2fSWei Yang     s->bat_dirty_block = 4 * qemu_real_host_page_size;
8730d31c7c2SDenis V. Lunev     s->bat_dirty_bmap =
8740d31c7c2SDenis V. Lunev         bitmap_new(DIV_ROUND_UP(s->header_size, s->bat_dirty_block));
8750d31c7c2SDenis V. Lunev 
876*a94750d9SEmanuele Giuseppe Esposito     /* Disable migration until bdrv_activate method is added */
8771d0f37cfSJeff Cody     error_setg(&s->migration_blocker, "The Parallels format used by node '%s' "
8781d0f37cfSJeff Cody                "does not support live migration",
8791d0f37cfSJeff Cody                bdrv_get_device_or_node_name(bs));
880386f6c07SMarkus Armbruster     ret = migrate_add_blocker(s->migration_blocker, errp);
881386f6c07SMarkus Armbruster     if (ret < 0) {
8821d0f37cfSJeff Cody         error_free(s->migration_blocker);
8831d0f37cfSJeff Cody         goto fail;
8841d0f37cfSJeff Cody     }
88523d6bd3bSDenis V. Lunev     qemu_co_mutex_init(&s->lock);
88623d6bd3bSDenis V. Lunev     return 0;
88723d6bd3bSDenis V. Lunev 
88823d6bd3bSDenis V. Lunev fail_format:
88923d6bd3bSDenis V. Lunev     error_setg(errp, "Image not in Parallels format");
8904bc6d7eeSMarkus Armbruster fail_options:
89123d6bd3bSDenis V. Lunev     ret = -EINVAL;
89223d6bd3bSDenis V. Lunev fail:
89323d6bd3bSDenis V. Lunev     qemu_vfree(s->header);
89423d6bd3bSDenis V. Lunev     return ret;
89523d6bd3bSDenis V. Lunev }
89623d6bd3bSDenis V. Lunev 
89723d6bd3bSDenis V. Lunev 
898019d6b8fSAnthony Liguori static void parallels_close(BlockDriverState *bs)
899019d6b8fSAnthony Liguori {
900019d6b8fSAnthony Liguori     BDRVParallelsState *s = bs->opaque;
9016dd6b9f1SDenis V. Lunev 
9026c7d390bSJeff Cody     if ((bs->open_flags & BDRV_O_RDWR) && !(bs->open_flags & BDRV_O_INACTIVE)) {
9036dd6b9f1SDenis V. Lunev         s->header->inuse = 0;
9046dd6b9f1SDenis V. Lunev         parallels_update_header(bs);
905e8d04f92SMax Reitz 
906e8d04f92SMax Reitz         /* errors are ignored, so we might as well pass exact=true */
907e8d04f92SMax Reitz         bdrv_truncate(bs->file, s->data_end << BDRV_SECTOR_BITS, true,
9087b8e4857SKevin Wolf                       PREALLOC_MODE_OFF, 0, NULL);
90919f5dc15SDenis V. Lunev     }
91019f5dc15SDenis V. Lunev 
9110d31c7c2SDenis V. Lunev     g_free(s->bat_dirty_bmap);
9129eae9ccaSDenis V. Lunev     qemu_vfree(s->header);
9131d0f37cfSJeff Cody 
9141d0f37cfSJeff Cody     migrate_del_blocker(s->migration_blocker);
9151d0f37cfSJeff Cody     error_free(s->migration_blocker);
916019d6b8fSAnthony Liguori }
917019d6b8fSAnthony Liguori 
918019d6b8fSAnthony Liguori static BlockDriver bdrv_parallels = {
919019d6b8fSAnthony Liguori     .format_name	= "parallels",
920019d6b8fSAnthony Liguori     .instance_size	= sizeof(BDRVParallelsState),
921019d6b8fSAnthony Liguori     .bdrv_probe		= parallels_probe,
9221dec5a70SChristoph Hellwig     .bdrv_open		= parallels_open,
923019d6b8fSAnthony Liguori     .bdrv_close		= parallels_close,
92469dca43dSMax Reitz     .bdrv_child_perm          = bdrv_default_perms,
9258e0cf59dSEric Blake     .bdrv_co_block_status     = parallels_co_block_status,
926d0e61ce5SDenis V. Lunev     .bdrv_has_zero_init       = bdrv_has_zero_init_1,
9270d31c7c2SDenis V. Lunev     .bdrv_co_flush_to_os      = parallels_co_flush_to_os,
928481fb9cfSDenis V. Lunev     .bdrv_co_readv  = parallels_co_readv,
9295a41e1faSDenis V. Lunev     .bdrv_co_writev = parallels_co_writev,
930d67066d8SMax Reitz     .is_format      = true,
931bcbb3866SEdgar Kaziakhmedov     .supports_backing = true,
9321511b490SKevin Wolf     .bdrv_co_create      = parallels_co_create,
933efc75e2aSStefan Hajnoczi     .bdrv_co_create_opts = parallels_co_create_opts,
9342fd61638SPaolo Bonzini     .bdrv_co_check  = parallels_co_check,
93574cf6c50SDenis V. Lunev     .create_opts    = &parallels_create_opts,
936019d6b8fSAnthony Liguori };
937019d6b8fSAnthony Liguori 
938019d6b8fSAnthony Liguori static void bdrv_parallels_init(void)
939019d6b8fSAnthony Liguori {
940019d6b8fSAnthony Liguori     bdrv_register(&bdrv_parallels);
941019d6b8fSAnthony Liguori }
942019d6b8fSAnthony Liguori 
943019d6b8fSAnthony Liguori block_init(bdrv_parallels_init);
944