xref: /qemu/block/vdi.c (revision e9082e47)
/*
 * Block driver for the Virtual Disk Image (VDI) format
 *
 * Copyright (c) 2009, 2012 Stefan Weil
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 2 of the License, or
 * (at your option) version 3 or any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 *
 * Reference:
 * http://forums.virtualbox.org/viewtopic.php?t=8046
 *
 * This driver supports create / read / write operations on VDI images.
 *
 * Todo (see also TODO in code):
 *
 * Some features like snapshots are still missing.
 *
 * Deallocation of zero-filled blocks and shrinking images are missing, too
 * (might be added to common block layer).
 *
 * Allocation of blocks could be optimized (less writes to block map and
 * header).
 *
 * Read and write of adjacent blocks could be done in one operation
 * (current code uses one operation per block (1 MiB)).
 *
 * The code is not thread safe (missing locks for changes in header and
 * block table, no problem with current QEMU).
 *
 * Hints:
 *
 * Blocks (VDI documentation) correspond to clusters (QEMU).
 * QEMU's backing files could be implemented using VDI snapshot files (TODO).
 * VDI snapshot files may also contain the complete machine state.
 * Maybe this machine state can be converted to QEMU PC machine snapshot data.
 *
 * The driver keeps a block cache (little endian entries) in memory.
 * For the standard block size (1 MiB), a 1 TiB disk will use 4 MiB RAM,
 * so this seems to be reasonable.
 */
519aebd98aSStefan Weil 
529aebd98aSStefan Weil #include "qemu-common.h"
53737e150eSPaolo Bonzini #include "block/block_int.h"
541de7afc9SPaolo Bonzini #include "qemu/module.h"
55caf71f86SPaolo Bonzini #include "migration/migration.h"
569aebd98aSStefan Weil 
57ee682d27SStefan Weil #if defined(CONFIG_UUID)
589aebd98aSStefan Weil #include <uuid/uuid.h>
599aebd98aSStefan Weil #else
609aebd98aSStefan Weil /* TODO: move uuid emulation to some central place in QEMU. */
619c17d615SPaolo Bonzini #include "sysemu/sysemu.h"     /* UUID_FMT */
629aebd98aSStefan Weil typedef unsigned char uuid_t[16];
639aebd98aSStefan Weil #endif
649aebd98aSStefan Weil 
659aebd98aSStefan Weil /* Code configuration options. */
669aebd98aSStefan Weil 
679aebd98aSStefan Weil /* Enable debug messages. */
689aebd98aSStefan Weil //~ #define CONFIG_VDI_DEBUG
699aebd98aSStefan Weil 
709aebd98aSStefan Weil /* Support write operations on VDI images. */
719aebd98aSStefan Weil #define CONFIG_VDI_WRITE
729aebd98aSStefan Weil 
739aebd98aSStefan Weil /* Support non-standard block (cluster) size. This is untested.
749aebd98aSStefan Weil  * Maybe it will be needed for very large images.
759aebd98aSStefan Weil  */
769aebd98aSStefan Weil //~ #define CONFIG_VDI_BLOCK_SIZE
779aebd98aSStefan Weil 
789aebd98aSStefan Weil /* Support static (fixed, pre-allocated) images. */
799aebd98aSStefan Weil #define CONFIG_VDI_STATIC_IMAGE
809aebd98aSStefan Weil 
819aebd98aSStefan Weil /* Command line option for static images. */
829aebd98aSStefan Weil #define BLOCK_OPT_STATIC "static"
839aebd98aSStefan Weil 
849aebd98aSStefan Weil #define KiB     1024
859aebd98aSStefan Weil #define MiB     (KiB * KiB)
869aebd98aSStefan Weil 
879aebd98aSStefan Weil #define SECTOR_SIZE 512
8899cce9faSKevin Wolf #define DEFAULT_CLUSTER_SIZE (1 * MiB)
899aebd98aSStefan Weil 
909aebd98aSStefan Weil #if defined(CONFIG_VDI_DEBUG)
919aebd98aSStefan Weil #define logout(fmt, ...) \
929aebd98aSStefan Weil                 fprintf(stderr, "vdi\t%-24s" fmt, __func__, ##__VA_ARGS__)
939aebd98aSStefan Weil #else
949aebd98aSStefan Weil #define logout(fmt, ...) ((void)0)
959aebd98aSStefan Weil #endif
969aebd98aSStefan Weil 
979aebd98aSStefan Weil /* Image signature. */
989aebd98aSStefan Weil #define VDI_SIGNATURE 0xbeda107f
999aebd98aSStefan Weil 
1009aebd98aSStefan Weil /* Image version. */
1019aebd98aSStefan Weil #define VDI_VERSION_1_1 0x00010001
1029aebd98aSStefan Weil 
1039aebd98aSStefan Weil /* Image type. */
1049aebd98aSStefan Weil #define VDI_TYPE_DYNAMIC 1
1059aebd98aSStefan Weil #define VDI_TYPE_STATIC  2
1069aebd98aSStefan Weil 
1079aebd98aSStefan Weil /* Innotek / SUN images use these strings in header.text:
1089aebd98aSStefan Weil  * "<<< innotek VirtualBox Disk Image >>>\n"
1099aebd98aSStefan Weil  * "<<< Sun xVM VirtualBox Disk Image >>>\n"
1109aebd98aSStefan Weil  * "<<< Sun VirtualBox Disk Image >>>\n"
1119aebd98aSStefan Weil  * The value does not matter, so QEMU created images use a different text.
1129aebd98aSStefan Weil  */
1139aebd98aSStefan Weil #define VDI_TEXT "<<< QEMU VM Virtual Disk Image >>>\n"
1149aebd98aSStefan Weil 
115c794b4e0SEric Sunshine /* A never-allocated block; semantically arbitrary content. */
116c794b4e0SEric Sunshine #define VDI_UNALLOCATED 0xffffffffU
117c794b4e0SEric Sunshine 
118c794b4e0SEric Sunshine /* A discarded (no longer allocated) block; semantically zero-filled. */
119c794b4e0SEric Sunshine #define VDI_DISCARDED   0xfffffffeU
120c794b4e0SEric Sunshine 
121c794b4e0SEric Sunshine #define VDI_IS_ALLOCATED(X) ((X) < VDI_DISCARDED)
1229aebd98aSStefan Weil 
12363fa06dcSJeff Cody /* max blocks in image is (0xffffffff / 4) */
12463fa06dcSJeff Cody #define VDI_BLOCKS_IN_IMAGE_MAX  0x3fffffff
12563fa06dcSJeff Cody #define VDI_DISK_SIZE_MAX        ((uint64_t)VDI_BLOCKS_IN_IMAGE_MAX * \
12663fa06dcSJeff Cody                                   (uint64_t)DEFAULT_CLUSTER_SIZE)
12763fa06dcSJeff Cody 
128ee682d27SStefan Weil #if !defined(CONFIG_UUID)
1298ba2aae3SStefan Hajnoczi static inline void uuid_generate(uuid_t out)
1309aebd98aSStefan Weil {
1314f3669eaSStefan Weil     memset(out, 0, sizeof(uuid_t));
1329aebd98aSStefan Weil }
1339aebd98aSStefan Weil 
1348ba2aae3SStefan Hajnoczi static inline int uuid_is_null(const uuid_t uu)
1359aebd98aSStefan Weil {
1369aebd98aSStefan Weil     uuid_t null_uuid = { 0 };
1374f3669eaSStefan Weil     return memcmp(uu, null_uuid, sizeof(uuid_t)) == 0;
1389aebd98aSStefan Weil }
1399aebd98aSStefan Weil 
1408ba2aae3SStefan Hajnoczi static inline void uuid_unparse(const uuid_t uu, char *out)
1419aebd98aSStefan Weil {
1429aebd98aSStefan Weil     snprintf(out, 37, UUID_FMT,
1439aebd98aSStefan Weil             uu[0], uu[1], uu[2], uu[3], uu[4], uu[5], uu[6], uu[7],
1449aebd98aSStefan Weil             uu[8], uu[9], uu[10], uu[11], uu[12], uu[13], uu[14], uu[15]);
1459aebd98aSStefan Weil }
1469aebd98aSStefan Weil #endif
1479aebd98aSStefan Weil 
1489aebd98aSStefan Weil typedef struct {
1499aebd98aSStefan Weil     char text[0x40];
1509aebd98aSStefan Weil     uint32_t signature;
1519aebd98aSStefan Weil     uint32_t version;
1529aebd98aSStefan Weil     uint32_t header_size;
1539aebd98aSStefan Weil     uint32_t image_type;
1549aebd98aSStefan Weil     uint32_t image_flags;
1559aebd98aSStefan Weil     char description[256];
1569aebd98aSStefan Weil     uint32_t offset_bmap;
1579aebd98aSStefan Weil     uint32_t offset_data;
1589aebd98aSStefan Weil     uint32_t cylinders;         /* disk geometry, unused here */
1599aebd98aSStefan Weil     uint32_t heads;             /* disk geometry, unused here */
1609aebd98aSStefan Weil     uint32_t sectors;           /* disk geometry, unused here */
1619aebd98aSStefan Weil     uint32_t sector_size;
1629aebd98aSStefan Weil     uint32_t unused1;
1639aebd98aSStefan Weil     uint64_t disk_size;
1649aebd98aSStefan Weil     uint32_t block_size;
1659aebd98aSStefan Weil     uint32_t block_extra;       /* unused here */
1669aebd98aSStefan Weil     uint32_t blocks_in_image;
1679aebd98aSStefan Weil     uint32_t blocks_allocated;
1689aebd98aSStefan Weil     uuid_t uuid_image;
1699aebd98aSStefan Weil     uuid_t uuid_last_snap;
1709aebd98aSStefan Weil     uuid_t uuid_link;
1719aebd98aSStefan Weil     uuid_t uuid_parent;
1729aebd98aSStefan Weil     uint64_t unused2[7];
1738368febdSJeff Cody } QEMU_PACKED VdiHeader;
1749aebd98aSStefan Weil 
1759aebd98aSStefan Weil typedef struct {
1769aebd98aSStefan Weil     /* The block map entries are little endian (even in memory). */
1779aebd98aSStefan Weil     uint32_t *bmap;
1789aebd98aSStefan Weil     /* Size of block (bytes). */
1799aebd98aSStefan Weil     uint32_t block_size;
1809aebd98aSStefan Weil     /* Size of block (sectors). */
1819aebd98aSStefan Weil     uint32_t block_sectors;
1829aebd98aSStefan Weil     /* First sector of block map. */
1839aebd98aSStefan Weil     uint32_t bmap_sector;
1844ff9786cSStefan Weil     /* VDI header (converted to host endianness). */
1859aebd98aSStefan Weil     VdiHeader header;
186fc9d106cSKevin Wolf 
187fc9d106cSKevin Wolf     Error *migration_blocker;
1889aebd98aSStefan Weil } BDRVVdiState;
1899aebd98aSStefan Weil 
1909aebd98aSStefan Weil /* Change UUID from little endian (IPRT = VirtualBox format) to big endian
1919aebd98aSStefan Weil  * format (network byte order, standard, see RFC 4122) and vice versa.
1929aebd98aSStefan Weil  */
1939aebd98aSStefan Weil static void uuid_convert(uuid_t uuid)
1949aebd98aSStefan Weil {
1959aebd98aSStefan Weil     bswap32s((uint32_t *)&uuid[0]);
1969aebd98aSStefan Weil     bswap16s((uint16_t *)&uuid[4]);
1979aebd98aSStefan Weil     bswap16s((uint16_t *)&uuid[6]);
1989aebd98aSStefan Weil }
1999aebd98aSStefan Weil 
2009aebd98aSStefan Weil static void vdi_header_to_cpu(VdiHeader *header)
2019aebd98aSStefan Weil {
2029aebd98aSStefan Weil     le32_to_cpus(&header->signature);
2039aebd98aSStefan Weil     le32_to_cpus(&header->version);
2049aebd98aSStefan Weil     le32_to_cpus(&header->header_size);
2059aebd98aSStefan Weil     le32_to_cpus(&header->image_type);
2069aebd98aSStefan Weil     le32_to_cpus(&header->image_flags);
2079aebd98aSStefan Weil     le32_to_cpus(&header->offset_bmap);
2089aebd98aSStefan Weil     le32_to_cpus(&header->offset_data);
2099aebd98aSStefan Weil     le32_to_cpus(&header->cylinders);
2109aebd98aSStefan Weil     le32_to_cpus(&header->heads);
2119aebd98aSStefan Weil     le32_to_cpus(&header->sectors);
2129aebd98aSStefan Weil     le32_to_cpus(&header->sector_size);
2139aebd98aSStefan Weil     le64_to_cpus(&header->disk_size);
2149aebd98aSStefan Weil     le32_to_cpus(&header->block_size);
2159aebd98aSStefan Weil     le32_to_cpus(&header->block_extra);
2169aebd98aSStefan Weil     le32_to_cpus(&header->blocks_in_image);
2179aebd98aSStefan Weil     le32_to_cpus(&header->blocks_allocated);
2189aebd98aSStefan Weil     uuid_convert(header->uuid_image);
2199aebd98aSStefan Weil     uuid_convert(header->uuid_last_snap);
2209aebd98aSStefan Weil     uuid_convert(header->uuid_link);
2219aebd98aSStefan Weil     uuid_convert(header->uuid_parent);
2229aebd98aSStefan Weil }
2239aebd98aSStefan Weil 
2249aebd98aSStefan Weil static void vdi_header_to_le(VdiHeader *header)
2259aebd98aSStefan Weil {
2269aebd98aSStefan Weil     cpu_to_le32s(&header->signature);
2279aebd98aSStefan Weil     cpu_to_le32s(&header->version);
2289aebd98aSStefan Weil     cpu_to_le32s(&header->header_size);
2299aebd98aSStefan Weil     cpu_to_le32s(&header->image_type);
2309aebd98aSStefan Weil     cpu_to_le32s(&header->image_flags);
2319aebd98aSStefan Weil     cpu_to_le32s(&header->offset_bmap);
2329aebd98aSStefan Weil     cpu_to_le32s(&header->offset_data);
2339aebd98aSStefan Weil     cpu_to_le32s(&header->cylinders);
2349aebd98aSStefan Weil     cpu_to_le32s(&header->heads);
2359aebd98aSStefan Weil     cpu_to_le32s(&header->sectors);
2369aebd98aSStefan Weil     cpu_to_le32s(&header->sector_size);
2379aebd98aSStefan Weil     cpu_to_le64s(&header->disk_size);
2389aebd98aSStefan Weil     cpu_to_le32s(&header->block_size);
2399aebd98aSStefan Weil     cpu_to_le32s(&header->block_extra);
2409aebd98aSStefan Weil     cpu_to_le32s(&header->blocks_in_image);
2419aebd98aSStefan Weil     cpu_to_le32s(&header->blocks_allocated);
2429aebd98aSStefan Weil     uuid_convert(header->uuid_image);
2439aebd98aSStefan Weil     uuid_convert(header->uuid_last_snap);
2449aebd98aSStefan Weil     uuid_convert(header->uuid_link);
2459aebd98aSStefan Weil     uuid_convert(header->uuid_parent);
2469aebd98aSStefan Weil }
2479aebd98aSStefan Weil 
#if defined(CONFIG_VDI_DEBUG)
/* Dump all interesting fields of a header (host endianness) with logout().
 *
 * Only compiled when CONFIG_VDI_DEBUG is defined.
 *
 * header->text and header->description are fixed-size arrays which come
 * straight from the image file, so they are not guaranteed to contain a
 * terminating NUL. They are therefore printed with an explicit precision
 * which limits the output to the size of the array.
 */
static void vdi_header_print(VdiHeader *header)
{
    char uuid[37];
    /* No "\n" here: the text of known images ends with a newline. */
    logout("text        %.*s", (int)sizeof(header->text), header->text);
    logout("signature   0x%08x\n", header->signature);
    logout("header size 0x%04x\n", header->header_size);
    logout("image type  0x%04x\n", header->image_type);
    logout("image flags 0x%04x\n", header->image_flags);
    logout("description %.*s\n",
           (int)sizeof(header->description), header->description);
    logout("offset bmap 0x%04x\n", header->offset_bmap);
    logout("offset data 0x%04x\n", header->offset_data);
    logout("cylinders   0x%04x\n", header->cylinders);
    logout("heads       0x%04x\n", header->heads);
    logout("sectors     0x%04x\n", header->sectors);
    logout("sector size 0x%04x\n", header->sector_size);
    logout("image size  0x%" PRIx64 " B (%" PRIu64 " MiB)\n",
           header->disk_size, header->disk_size / MiB);
    logout("block size  0x%04x\n", header->block_size);
    logout("block extra 0x%04x\n", header->block_extra);
    logout("blocks tot. 0x%04x\n", header->blocks_in_image);
    logout("blocks all. 0x%04x\n", header->blocks_allocated);
    uuid_unparse(header->uuid_image, uuid);
    logout("uuid image  %s\n", uuid);
    uuid_unparse(header->uuid_last_snap, uuid);
    logout("uuid snap   %s\n", uuid);
    uuid_unparse(header->uuid_link, uuid);
    logout("uuid link   %s\n", uuid);
    uuid_unparse(header->uuid_parent, uuid);
    logout("uuid parent %s\n", uuid);
}
#endif
2809aebd98aSStefan Weil 
2814534ff54SKevin Wolf static int vdi_check(BlockDriverState *bs, BdrvCheckResult *res,
2824534ff54SKevin Wolf                      BdrvCheckMode fix)
2839aebd98aSStefan Weil {
2849aebd98aSStefan Weil     /* TODO: additional checks possible. */
2859aebd98aSStefan Weil     BDRVVdiState *s = (BDRVVdiState *)bs->opaque;
2869aebd98aSStefan Weil     uint32_t blocks_allocated = 0;
2879aebd98aSStefan Weil     uint32_t block;
2889aebd98aSStefan Weil     uint32_t *bmap;
2899aebd98aSStefan Weil     logout("\n");
2909aebd98aSStefan Weil 
2914534ff54SKevin Wolf     if (fix) {
2924534ff54SKevin Wolf         return -ENOTSUP;
2934534ff54SKevin Wolf     }
2944534ff54SKevin Wolf 
2955839e53bSMarkus Armbruster     bmap = g_try_new(uint32_t, s->header.blocks_in_image);
29617cce735SKevin Wolf     if (s->header.blocks_in_image && bmap == NULL) {
29717cce735SKevin Wolf         res->check_errors++;
29817cce735SKevin Wolf         return -ENOMEM;
29917cce735SKevin Wolf     }
30017cce735SKevin Wolf 
3019aebd98aSStefan Weil     memset(bmap, 0xff, s->header.blocks_in_image * sizeof(uint32_t));
3029aebd98aSStefan Weil 
3039aebd98aSStefan Weil     /* Check block map and value of blocks_allocated. */
3049aebd98aSStefan Weil     for (block = 0; block < s->header.blocks_in_image; block++) {
3059aebd98aSStefan Weil         uint32_t bmap_entry = le32_to_cpu(s->bmap[block]);
306c794b4e0SEric Sunshine         if (VDI_IS_ALLOCATED(bmap_entry)) {
3079aebd98aSStefan Weil             if (bmap_entry < s->header.blocks_in_image) {
3089aebd98aSStefan Weil                 blocks_allocated++;
309c794b4e0SEric Sunshine                 if (!VDI_IS_ALLOCATED(bmap[bmap_entry])) {
3109aebd98aSStefan Weil                     bmap[bmap_entry] = bmap_entry;
3119aebd98aSStefan Weil                 } else {
3129aebd98aSStefan Weil                     fprintf(stderr, "ERROR: block index %" PRIu32
3139aebd98aSStefan Weil                             " also used by %" PRIu32 "\n", bmap[bmap_entry], bmap_entry);
3149ac228e0SKevin Wolf                     res->corruptions++;
3159aebd98aSStefan Weil                 }
3169aebd98aSStefan Weil             } else {
3179aebd98aSStefan Weil                 fprintf(stderr, "ERROR: block index %" PRIu32
3189aebd98aSStefan Weil                         " too large, is %" PRIu32 "\n", block, bmap_entry);
3199ac228e0SKevin Wolf                 res->corruptions++;
3209aebd98aSStefan Weil             }
3219aebd98aSStefan Weil         }
3229aebd98aSStefan Weil     }
3239aebd98aSStefan Weil     if (blocks_allocated != s->header.blocks_allocated) {
3249aebd98aSStefan Weil         fprintf(stderr, "ERROR: allocated blocks mismatch, is %" PRIu32
3259aebd98aSStefan Weil                ", should be %" PRIu32 "\n",
3269aebd98aSStefan Weil                blocks_allocated, s->header.blocks_allocated);
3279ac228e0SKevin Wolf         res->corruptions++;
3289aebd98aSStefan Weil     }
3299aebd98aSStefan Weil 
3307267c094SAnthony Liguori     g_free(bmap);
3319aebd98aSStefan Weil 
3329ac228e0SKevin Wolf     return 0;
3339aebd98aSStefan Weil }
3349aebd98aSStefan Weil 
3359aebd98aSStefan Weil static int vdi_get_info(BlockDriverState *bs, BlockDriverInfo *bdi)
3369aebd98aSStefan Weil {
3379aebd98aSStefan Weil     /* TODO: vdi_get_info would be needed for machine snapshots.
3389aebd98aSStefan Weil        vm_state_offset is still missing. */
3399aebd98aSStefan Weil     BDRVVdiState *s = (BDRVVdiState *)bs->opaque;
3409aebd98aSStefan Weil     logout("\n");
3419aebd98aSStefan Weil     bdi->cluster_size = s->block_size;
3429aebd98aSStefan Weil     bdi->vm_state_offset = 0;
34395de6d70SPaolo Bonzini     bdi->unallocated_blocks_are_zero = true;
3449aebd98aSStefan Weil     return 0;
3459aebd98aSStefan Weil }
3469aebd98aSStefan Weil 
3479aebd98aSStefan Weil static int vdi_make_empty(BlockDriverState *bs)
3489aebd98aSStefan Weil {
3499aebd98aSStefan Weil     /* TODO: missing code. */
3509aebd98aSStefan Weil     logout("\n");
3519aebd98aSStefan Weil     /* The return value for missing code must be 0, see block.c. */
3529aebd98aSStefan Weil     return 0;
3539aebd98aSStefan Weil }
3549aebd98aSStefan Weil 
3559aebd98aSStefan Weil static int vdi_probe(const uint8_t *buf, int buf_size, const char *filename)
3569aebd98aSStefan Weil {
3579aebd98aSStefan Weil     const VdiHeader *header = (const VdiHeader *)buf;
358dddc7750SJeff Cody     int ret = 0;
3599aebd98aSStefan Weil 
3609aebd98aSStefan Weil     logout("\n");
3619aebd98aSStefan Weil 
3629aebd98aSStefan Weil     if (buf_size < sizeof(*header)) {
3639aebd98aSStefan Weil         /* Header too small, no VDI. */
3649aebd98aSStefan Weil     } else if (le32_to_cpu(header->signature) == VDI_SIGNATURE) {
365dddc7750SJeff Cody         ret = 100;
3669aebd98aSStefan Weil     }
3679aebd98aSStefan Weil 
368dddc7750SJeff Cody     if (ret == 0) {
3699aebd98aSStefan Weil         logout("no vdi image\n");
3709aebd98aSStefan Weil     } else {
3719aebd98aSStefan Weil         logout("%s", header->text);
3729aebd98aSStefan Weil     }
3739aebd98aSStefan Weil 
374dddc7750SJeff Cody     return ret;
3759aebd98aSStefan Weil }
3769aebd98aSStefan Weil 
377015a1036SMax Reitz static int vdi_open(BlockDriverState *bs, QDict *options, int flags,
378015a1036SMax Reitz                     Error **errp)
3799aebd98aSStefan Weil {
3809aebd98aSStefan Weil     BDRVVdiState *s = bs->opaque;
3819aebd98aSStefan Weil     VdiHeader header;
3829aebd98aSStefan Weil     size_t bmap_size;
3838937f822SStefan Weil     int ret;
3849aebd98aSStefan Weil 
3859aebd98aSStefan Weil     logout("\n");
3869aebd98aSStefan Weil 
3878937f822SStefan Weil     ret = bdrv_read(bs->file, 0, (uint8_t *)&header, 1);
3888937f822SStefan Weil     if (ret < 0) {
3899aebd98aSStefan Weil         goto fail;
3909aebd98aSStefan Weil     }
3919aebd98aSStefan Weil 
3929aebd98aSStefan Weil     vdi_header_to_cpu(&header);
3939aebd98aSStefan Weil #if defined(CONFIG_VDI_DEBUG)
3949aebd98aSStefan Weil     vdi_header_print(&header);
3959aebd98aSStefan Weil #endif
3969aebd98aSStefan Weil 
39763fa06dcSJeff Cody     if (header.disk_size > VDI_DISK_SIZE_MAX) {
39863fa06dcSJeff Cody         error_setg(errp, "Unsupported VDI image size (size is 0x%" PRIx64
39963fa06dcSJeff Cody                           ", max supported is 0x%" PRIx64 ")",
40063fa06dcSJeff Cody                           header.disk_size, VDI_DISK_SIZE_MAX);
40163fa06dcSJeff Cody         ret = -ENOTSUP;
40263fa06dcSJeff Cody         goto fail;
40363fa06dcSJeff Cody     }
40463fa06dcSJeff Cody 
405f21dc3a4SStefan Weil     if (header.disk_size % SECTOR_SIZE != 0) {
406f21dc3a4SStefan Weil         /* 'VBoxManage convertfromraw' can create images with odd disk sizes.
407f21dc3a4SStefan Weil            We accept them but round the disk size to the next multiple of
408f21dc3a4SStefan Weil            SECTOR_SIZE. */
409f21dc3a4SStefan Weil         logout("odd disk size %" PRIu64 " B, round up\n", header.disk_size);
410*e9082e47SMax Reitz         header.disk_size = ROUND_UP(header.disk_size, SECTOR_SIZE);
411f21dc3a4SStefan Weil     }
412f21dc3a4SStefan Weil 
4130e87ba2cSStefan Weil     if (header.signature != VDI_SIGNATURE) {
414521b2b5dSMax Reitz         error_setg(errp, "Image not in VDI format (bad signature %08" PRIx32
415521b2b5dSMax Reitz                    ")", header.signature);
41676abe407SPaolo Bonzini         ret = -EINVAL;
4170e87ba2cSStefan Weil         goto fail;
4180e87ba2cSStefan Weil     } else if (header.version != VDI_VERSION_1_1) {
419521b2b5dSMax Reitz         error_setg(errp, "unsupported VDI image (version %" PRIu32 ".%" PRIu32
420521b2b5dSMax Reitz                    ")", header.version >> 16, header.version & 0xffff);
4218937f822SStefan Weil         ret = -ENOTSUP;
4229aebd98aSStefan Weil         goto fail;
4239aebd98aSStefan Weil     } else if (header.offset_bmap % SECTOR_SIZE != 0) {
4249aebd98aSStefan Weil         /* We only support block maps which start on a sector boundary. */
4255b7aa9b5SPaolo Bonzini         error_setg(errp, "unsupported VDI image (unaligned block map offset "
426521b2b5dSMax Reitz                    "0x%" PRIx32 ")", header.offset_bmap);
4278937f822SStefan Weil         ret = -ENOTSUP;
4289aebd98aSStefan Weil         goto fail;
4299aebd98aSStefan Weil     } else if (header.offset_data % SECTOR_SIZE != 0) {
4309aebd98aSStefan Weil         /* We only support data blocks which start on a sector boundary. */
431521b2b5dSMax Reitz         error_setg(errp, "unsupported VDI image (unaligned data offset 0x%"
432521b2b5dSMax Reitz                    PRIx32 ")", header.offset_data);
4338937f822SStefan Weil         ret = -ENOTSUP;
4349aebd98aSStefan Weil         goto fail;
4359aebd98aSStefan Weil     } else if (header.sector_size != SECTOR_SIZE) {
436521b2b5dSMax Reitz         error_setg(errp, "unsupported VDI image (sector size %" PRIu32
437521b2b5dSMax Reitz                    " is not %u)", header.sector_size, SECTOR_SIZE);
4388937f822SStefan Weil         ret = -ENOTSUP;
4399aebd98aSStefan Weil         goto fail;
44063fa06dcSJeff Cody     } else if (header.block_size != DEFAULT_CLUSTER_SIZE) {
441521b2b5dSMax Reitz         error_setg(errp, "unsupported VDI image (block size %" PRIu32
442521b2b5dSMax Reitz                    " is not %u)", header.block_size, DEFAULT_CLUSTER_SIZE);
4438937f822SStefan Weil         ret = -ENOTSUP;
4449aebd98aSStefan Weil         goto fail;
445f21dc3a4SStefan Weil     } else if (header.disk_size >
446f21dc3a4SStefan Weil                (uint64_t)header.blocks_in_image * header.block_size) {
4475b7aa9b5SPaolo Bonzini         error_setg(errp, "unsupported VDI image (disk size %" PRIu64 ", "
4485b7aa9b5SPaolo Bonzini                    "image bitmap has room for %" PRIu64 ")",
4495b7aa9b5SPaolo Bonzini                    header.disk_size,
4505b7aa9b5SPaolo Bonzini                    (uint64_t)header.blocks_in_image * header.block_size);
4518937f822SStefan Weil         ret = -ENOTSUP;
4529aebd98aSStefan Weil         goto fail;
4539aebd98aSStefan Weil     } else if (!uuid_is_null(header.uuid_link)) {
4545b7aa9b5SPaolo Bonzini         error_setg(errp, "unsupported VDI image (non-NULL link UUID)");
4558937f822SStefan Weil         ret = -ENOTSUP;
4569aebd98aSStefan Weil         goto fail;
4579aebd98aSStefan Weil     } else if (!uuid_is_null(header.uuid_parent)) {
4585b7aa9b5SPaolo Bonzini         error_setg(errp, "unsupported VDI image (non-NULL parent UUID)");
4598937f822SStefan Weil         ret = -ENOTSUP;
4609aebd98aSStefan Weil         goto fail;
46163fa06dcSJeff Cody     } else if (header.blocks_in_image > VDI_BLOCKS_IN_IMAGE_MAX) {
46263fa06dcSJeff Cody         error_setg(errp, "unsupported VDI image "
46363fa06dcSJeff Cody                          "(too many blocks %u, max is %u)",
46463fa06dcSJeff Cody                           header.blocks_in_image, VDI_BLOCKS_IN_IMAGE_MAX);
46563fa06dcSJeff Cody         ret = -ENOTSUP;
46663fa06dcSJeff Cody         goto fail;
4679aebd98aSStefan Weil     }
4689aebd98aSStefan Weil 
4699aebd98aSStefan Weil     bs->total_sectors = header.disk_size / SECTOR_SIZE;
4709aebd98aSStefan Weil 
4719aebd98aSStefan Weil     s->block_size = header.block_size;
4729aebd98aSStefan Weil     s->block_sectors = header.block_size / SECTOR_SIZE;
4739aebd98aSStefan Weil     s->bmap_sector = header.offset_bmap / SECTOR_SIZE;
4749aebd98aSStefan Weil     s->header = header;
4759aebd98aSStefan Weil 
4769aebd98aSStefan Weil     bmap_size = header.blocks_in_image * sizeof(uint32_t);
477*e9082e47SMax Reitz     bmap_size = DIV_ROUND_UP(bmap_size, SECTOR_SIZE);
47817cce735SKevin Wolf     s->bmap = qemu_try_blockalign(bs->file, bmap_size * SECTOR_SIZE);
47917cce735SKevin Wolf     if (s->bmap == NULL) {
48017cce735SKevin Wolf         ret = -ENOMEM;
48117cce735SKevin Wolf         goto fail;
48217cce735SKevin Wolf     }
48317cce735SKevin Wolf 
4848937f822SStefan Weil     ret = bdrv_read(bs->file, s->bmap_sector, (uint8_t *)s->bmap, bmap_size);
4858937f822SStefan Weil     if (ret < 0) {
4869aebd98aSStefan Weil         goto fail_free_bmap;
4879aebd98aSStefan Weil     }
4889aebd98aSStefan Weil 
489fc9d106cSKevin Wolf     /* Disable migration when vdi images are used */
490fc9d106cSKevin Wolf     error_set(&s->migration_blocker,
491fc9d106cSKevin Wolf               QERR_BLOCK_FORMAT_FEATURE_NOT_SUPPORTED,
492bfb197e0SMarkus Armbruster               "vdi", bdrv_get_device_name(bs), "live migration");
493fc9d106cSKevin Wolf     migrate_add_blocker(s->migration_blocker);
494fc9d106cSKevin Wolf 
4959aebd98aSStefan Weil     return 0;
4969aebd98aSStefan Weil 
4979aebd98aSStefan Weil  fail_free_bmap:
49817cce735SKevin Wolf     qemu_vfree(s->bmap);
4999aebd98aSStefan Weil 
5009aebd98aSStefan Weil  fail:
5018937f822SStefan Weil     return ret;
5029aebd98aSStefan Weil }
5039aebd98aSStefan Weil 
504ecfe2bbaSJeff Cody static int vdi_reopen_prepare(BDRVReopenState *state,
505ecfe2bbaSJeff Cody                               BlockReopenQueue *queue, Error **errp)
506ecfe2bbaSJeff Cody {
507ecfe2bbaSJeff Cody     return 0;
508ecfe2bbaSJeff Cody }
509ecfe2bbaSJeff Cody 
510b6b8a333SPaolo Bonzini static int64_t coroutine_fn vdi_co_get_block_status(BlockDriverState *bs,
511e850b35aSStefan Hajnoczi         int64_t sector_num, int nb_sectors, int *pnum)
5129aebd98aSStefan Weil {
5139aebd98aSStefan Weil     /* TODO: Check for too large sector_num (in bdrv_is_allocated or here). */
5149aebd98aSStefan Weil     BDRVVdiState *s = (BDRVVdiState *)bs->opaque;
5159aebd98aSStefan Weil     size_t bmap_index = sector_num / s->block_sectors;
5169aebd98aSStefan Weil     size_t sector_in_block = sector_num % s->block_sectors;
5179aebd98aSStefan Weil     int n_sectors = s->block_sectors - sector_in_block;
5189aebd98aSStefan Weil     uint32_t bmap_entry = le32_to_cpu(s->bmap[bmap_index]);
5194bc74be9SPaolo Bonzini     uint64_t offset;
5204bc74be9SPaolo Bonzini     int result;
5214bc74be9SPaolo Bonzini 
5229aebd98aSStefan Weil     logout("%p, %" PRId64 ", %d, %p\n", bs, sector_num, nb_sectors, pnum);
5239aebd98aSStefan Weil     if (n_sectors > nb_sectors) {
5249aebd98aSStefan Weil         n_sectors = nb_sectors;
5259aebd98aSStefan Weil     }
5269aebd98aSStefan Weil     *pnum = n_sectors;
5274bc74be9SPaolo Bonzini     result = VDI_IS_ALLOCATED(bmap_entry);
5284bc74be9SPaolo Bonzini     if (!result) {
5294bc74be9SPaolo Bonzini         return 0;
5304bc74be9SPaolo Bonzini     }
5314bc74be9SPaolo Bonzini 
5324bc74be9SPaolo Bonzini     offset = s->header.offset_data +
5334bc74be9SPaolo Bonzini                               (uint64_t)bmap_entry * s->block_size +
5344bc74be9SPaolo Bonzini                               sector_in_block * SECTOR_SIZE;
5354bc74be9SPaolo Bonzini     return BDRV_BLOCK_DATA | BDRV_BLOCK_OFFSET_VALID | offset;
5369aebd98aSStefan Weil }
5379aebd98aSStefan Weil 
538a7a43aa1SPaolo Bonzini static int vdi_co_read(BlockDriverState *bs,
539a7a43aa1SPaolo Bonzini         int64_t sector_num, uint8_t *buf, int nb_sectors)
5409aebd98aSStefan Weil {
5419aebd98aSStefan Weil     BDRVVdiState *s = bs->opaque;
5429aebd98aSStefan Weil     uint32_t bmap_entry;
5439aebd98aSStefan Weil     uint32_t block_index;
5449aebd98aSStefan Weil     uint32_t sector_in_block;
5459aebd98aSStefan Weil     uint32_t n_sectors;
546eb9566d1SPaolo Bonzini     int ret = 0;
5474de659e8SPaolo Bonzini 
5484de659e8SPaolo Bonzini     logout("\n");
5499aebd98aSStefan Weil 
550eb9566d1SPaolo Bonzini     while (ret >= 0 && nb_sectors > 0) {
551bfc45fc1SPaolo Bonzini         block_index = sector_num / s->block_sectors;
552bfc45fc1SPaolo Bonzini         sector_in_block = sector_num % s->block_sectors;
5539aebd98aSStefan Weil         n_sectors = s->block_sectors - sector_in_block;
554bfc45fc1SPaolo Bonzini         if (n_sectors > nb_sectors) {
555bfc45fc1SPaolo Bonzini             n_sectors = nb_sectors;
5569aebd98aSStefan Weil         }
5579aebd98aSStefan Weil 
5589aebd98aSStefan Weil         logout("will read %u sectors starting at sector %" PRIu64 "\n",
559bfc45fc1SPaolo Bonzini                n_sectors, sector_num);
5609aebd98aSStefan Weil 
5619aebd98aSStefan Weil         /* prepare next AIO request */
5629aebd98aSStefan Weil         bmap_entry = le32_to_cpu(s->bmap[block_index]);
563c794b4e0SEric Sunshine         if (!VDI_IS_ALLOCATED(bmap_entry)) {
5649aebd98aSStefan Weil             /* Block not allocated, return zeros, no need to wait. */
565a7a43aa1SPaolo Bonzini             memset(buf, 0, n_sectors * SECTOR_SIZE);
5663d46a75aSPaolo Bonzini             ret = 0;
5679aebd98aSStefan Weil         } else {
5689aebd98aSStefan Weil             uint64_t offset = s->header.offset_data / SECTOR_SIZE +
5699aebd98aSStefan Weil                               (uint64_t)bmap_entry * s->block_sectors +
5709aebd98aSStefan Weil                               sector_in_block;
5714eea78e6SPaolo Bonzini             ret = bdrv_read(bs->file, offset, buf, n_sectors);
5729aebd98aSStefan Weil         }
573bfc45fc1SPaolo Bonzini         logout("%u sectors read\n", n_sectors);
5740c7bfc32SPaolo Bonzini 
575bfc45fc1SPaolo Bonzini         nb_sectors -= n_sectors;
576bfc45fc1SPaolo Bonzini         sector_num += n_sectors;
577a7a43aa1SPaolo Bonzini         buf += n_sectors * SECTOR_SIZE;
5783d46a75aSPaolo Bonzini     }
5793d46a75aSPaolo Bonzini 
5803d46a75aSPaolo Bonzini     return ret;
5819aebd98aSStefan Weil }
5829aebd98aSStefan Weil 
583a7a43aa1SPaolo Bonzini static int vdi_co_write(BlockDriverState *bs,
584a7a43aa1SPaolo Bonzini         int64_t sector_num, const uint8_t *buf, int nb_sectors)
5859aebd98aSStefan Weil {
5869aebd98aSStefan Weil     BDRVVdiState *s = bs->opaque;
5879aebd98aSStefan Weil     uint32_t bmap_entry;
5889aebd98aSStefan Weil     uint32_t block_index;
5899aebd98aSStefan Weil     uint32_t sector_in_block;
5909aebd98aSStefan Weil     uint32_t n_sectors;
591bfc45fc1SPaolo Bonzini     uint32_t bmap_first = VDI_UNALLOCATED;
592bfc45fc1SPaolo Bonzini     uint32_t bmap_last = VDI_UNALLOCATED;
593bfc45fc1SPaolo Bonzini     uint8_t *block = NULL;
594eb9566d1SPaolo Bonzini     int ret = 0;
5954de659e8SPaolo Bonzini 
5964de659e8SPaolo Bonzini     logout("\n");
5979aebd98aSStefan Weil 
598eb9566d1SPaolo Bonzini     while (ret >= 0 && nb_sectors > 0) {
599bfc45fc1SPaolo Bonzini         block_index = sector_num / s->block_sectors;
600bfc45fc1SPaolo Bonzini         sector_in_block = sector_num % s->block_sectors;
6019aebd98aSStefan Weil         n_sectors = s->block_sectors - sector_in_block;
602bfc45fc1SPaolo Bonzini         if (n_sectors > nb_sectors) {
603bfc45fc1SPaolo Bonzini             n_sectors = nb_sectors;
6049aebd98aSStefan Weil         }
6059aebd98aSStefan Weil 
6069aebd98aSStefan Weil         logout("will write %u sectors starting at sector %" PRIu64 "\n",
607bfc45fc1SPaolo Bonzini                n_sectors, sector_num);
6089aebd98aSStefan Weil 
6099aebd98aSStefan Weil         /* prepare next AIO request */
6109aebd98aSStefan Weil         bmap_entry = le32_to_cpu(s->bmap[block_index]);
611c794b4e0SEric Sunshine         if (!VDI_IS_ALLOCATED(bmap_entry)) {
6129aebd98aSStefan Weil             /* Allocate new block and write to it. */
6139aebd98aSStefan Weil             uint64_t offset;
6149aebd98aSStefan Weil             bmap_entry = s->header.blocks_allocated;
6159aebd98aSStefan Weil             s->bmap[block_index] = cpu_to_le32(bmap_entry);
6169aebd98aSStefan Weil             s->header.blocks_allocated++;
6179aebd98aSStefan Weil             offset = s->header.offset_data / SECTOR_SIZE +
6189aebd98aSStefan Weil                      (uint64_t)bmap_entry * s->block_sectors;
6199aebd98aSStefan Weil             if (block == NULL) {
620641543b7SStefan Weil                 block = g_malloc(s->block_size);
621bfc45fc1SPaolo Bonzini                 bmap_first = block_index;
6229aebd98aSStefan Weil             }
623bfc45fc1SPaolo Bonzini             bmap_last = block_index;
624641543b7SStefan Weil             /* Copy data to be written to new block and zero unused parts. */
625641543b7SStefan Weil             memset(block, 0, sector_in_block * SECTOR_SIZE);
6269aebd98aSStefan Weil             memcpy(block + sector_in_block * SECTOR_SIZE,
627a7a43aa1SPaolo Bonzini                    buf, n_sectors * SECTOR_SIZE);
628641543b7SStefan Weil             memset(block + (sector_in_block + n_sectors) * SECTOR_SIZE, 0,
629641543b7SStefan Weil                    (s->block_sectors - n_sectors - sector_in_block) * SECTOR_SIZE);
6304eea78e6SPaolo Bonzini             ret = bdrv_write(bs->file, offset, block, s->block_sectors);
6319aebd98aSStefan Weil         } else {
6329aebd98aSStefan Weil             uint64_t offset = s->header.offset_data / SECTOR_SIZE +
6339aebd98aSStefan Weil                               (uint64_t)bmap_entry * s->block_sectors +
6349aebd98aSStefan Weil                               sector_in_block;
6354eea78e6SPaolo Bonzini             ret = bdrv_write(bs->file, offset, buf, n_sectors);
6369aebd98aSStefan Weil         }
6370c7bfc32SPaolo Bonzini 
638bfc45fc1SPaolo Bonzini         nb_sectors -= n_sectors;
639bfc45fc1SPaolo Bonzini         sector_num += n_sectors;
640a7a43aa1SPaolo Bonzini         buf += n_sectors * SECTOR_SIZE;
6410c7bfc32SPaolo Bonzini 
642bfc45fc1SPaolo Bonzini         logout("%u sectors written\n", n_sectors);
6433d46a75aSPaolo Bonzini     }
6449aebd98aSStefan Weil 
6450c7bfc32SPaolo Bonzini     logout("finished data write\n");
6464eea78e6SPaolo Bonzini     if (ret < 0) {
6474eea78e6SPaolo Bonzini         return ret;
6484eea78e6SPaolo Bonzini     }
6494eea78e6SPaolo Bonzini 
650bfc45fc1SPaolo Bonzini     if (block) {
6514eea78e6SPaolo Bonzini         /* One or more new blocks were allocated. */
652bfc45fc1SPaolo Bonzini         VdiHeader *header = (VdiHeader *) block;
6534eea78e6SPaolo Bonzini         uint8_t *base;
6544eea78e6SPaolo Bonzini         uint64_t offset;
6554eea78e6SPaolo Bonzini 
6560c7bfc32SPaolo Bonzini         logout("now writing modified header\n");
657bfc45fc1SPaolo Bonzini         assert(VDI_IS_ALLOCATED(bmap_first));
6580c7bfc32SPaolo Bonzini         *header = s->header;
6590c7bfc32SPaolo Bonzini         vdi_header_to_le(header);
6604eea78e6SPaolo Bonzini         ret = bdrv_write(bs->file, 0, block, 1);
661bfc45fc1SPaolo Bonzini         g_free(block);
662bfc45fc1SPaolo Bonzini         block = NULL;
6634eea78e6SPaolo Bonzini 
6644eea78e6SPaolo Bonzini         if (ret < 0) {
6654eea78e6SPaolo Bonzini             return ret;
6664eea78e6SPaolo Bonzini         }
6674eea78e6SPaolo Bonzini 
6680c7bfc32SPaolo Bonzini         logout("now writing modified block map entry %u...%u\n",
6690c7bfc32SPaolo Bonzini                bmap_first, bmap_last);
6700c7bfc32SPaolo Bonzini         /* Write modified sectors from block map. */
6710c7bfc32SPaolo Bonzini         bmap_first /= (SECTOR_SIZE / sizeof(uint32_t));
6720c7bfc32SPaolo Bonzini         bmap_last /= (SECTOR_SIZE / sizeof(uint32_t));
6730c7bfc32SPaolo Bonzini         n_sectors = bmap_last - bmap_first + 1;
6740c7bfc32SPaolo Bonzini         offset = s->bmap_sector + bmap_first;
6754eea78e6SPaolo Bonzini         base = ((uint8_t *)&s->bmap[0]) + bmap_first * SECTOR_SIZE;
6760c7bfc32SPaolo Bonzini         logout("will write %u block map sectors starting from entry %u\n",
6770c7bfc32SPaolo Bonzini                n_sectors, bmap_first);
6784eea78e6SPaolo Bonzini         ret = bdrv_write(bs->file, offset, base, n_sectors);
6790c7bfc32SPaolo Bonzini     }
6800c7bfc32SPaolo Bonzini 
6813d46a75aSPaolo Bonzini     return ret;
6829aebd98aSStefan Weil }
6839aebd98aSStefan Weil 
684004b7f25SChunyan Liu static int vdi_create(const char *filename, QemuOpts *opts, Error **errp)
6859aebd98aSStefan Weil {
686dddc7750SJeff Cody     int ret = 0;
6879aebd98aSStefan Weil     uint64_t bytes = 0;
6889aebd98aSStefan Weil     uint32_t blocks;
68999cce9faSKevin Wolf     size_t block_size = DEFAULT_CLUSTER_SIZE;
6909aebd98aSStefan Weil     uint32_t image_type = VDI_TYPE_DYNAMIC;
6919aebd98aSStefan Weil     VdiHeader header;
6929aebd98aSStefan Weil     size_t i;
6939aebd98aSStefan Weil     size_t bmap_size;
69470747862SJeff Cody     int64_t offset = 0;
69570747862SJeff Cody     Error *local_err = NULL;
69670747862SJeff Cody     BlockDriverState *bs = NULL;
69770747862SJeff Cody     uint32_t *bmap = NULL;
6989aebd98aSStefan Weil 
6999aebd98aSStefan Weil     logout("\n");
7009aebd98aSStefan Weil 
7019aebd98aSStefan Weil     /* Read out options. */
702c2eb918eSHu Tao     bytes = ROUND_UP(qemu_opt_get_size_del(opts, BLOCK_OPT_SIZE, 0),
703c2eb918eSHu Tao                      BDRV_SECTOR_SIZE);
7049aebd98aSStefan Weil #if defined(CONFIG_VDI_BLOCK_SIZE)
7059aebd98aSStefan Weil     /* TODO: Additional checks (SECTOR_SIZE * 2^n, ...). */
706004b7f25SChunyan Liu     block_size = qemu_opt_get_size_del(opts,
707004b7f25SChunyan Liu                                        BLOCK_OPT_CLUSTER_SIZE,
708004b7f25SChunyan Liu                                        DEFAULT_CLUSTER_SIZE);
7099aebd98aSStefan Weil #endif
7109aebd98aSStefan Weil #if defined(CONFIG_VDI_STATIC_IMAGE)
711004b7f25SChunyan Liu     if (qemu_opt_get_bool_del(opts, BLOCK_OPT_STATIC, false)) {
7129aebd98aSStefan Weil         image_type = VDI_TYPE_STATIC;
7136eea90ebSStefan Weil     }
7149aebd98aSStefan Weil #endif
7159aebd98aSStefan Weil 
71663fa06dcSJeff Cody     if (bytes > VDI_DISK_SIZE_MAX) {
717dddc7750SJeff Cody         ret = -ENOTSUP;
71863fa06dcSJeff Cody         error_setg(errp, "Unsupported VDI image size (size is 0x%" PRIx64
71963fa06dcSJeff Cody                           ", max supported is 0x%" PRIx64 ")",
72063fa06dcSJeff Cody                           bytes, VDI_DISK_SIZE_MAX);
72163fa06dcSJeff Cody         goto exit;
72263fa06dcSJeff Cody     }
72363fa06dcSJeff Cody 
724dddc7750SJeff Cody     ret = bdrv_create_file(filename, opts, &local_err);
725dddc7750SJeff Cody     if (ret < 0) {
72670747862SJeff Cody         error_propagate(errp, local_err);
72763fa06dcSJeff Cody         goto exit;
7289aebd98aSStefan Weil     }
729dddc7750SJeff Cody     ret = bdrv_open(&bs, filename, NULL, NULL, BDRV_O_RDWR | BDRV_O_PROTOCOL,
73070747862SJeff Cody                     NULL, &local_err);
731dddc7750SJeff Cody     if (ret < 0) {
73270747862SJeff Cody         error_propagate(errp, local_err);
73370747862SJeff Cody         goto exit;
7344ab15590SChunyan Liu     }
7354ab15590SChunyan Liu 
736f21dc3a4SStefan Weil     /* We need enough blocks to store the given disk size,
737f21dc3a4SStefan Weil        so always round up. */
738*e9082e47SMax Reitz     blocks = DIV_ROUND_UP(bytes, block_size);
739f21dc3a4SStefan Weil 
7409aebd98aSStefan Weil     bmap_size = blocks * sizeof(uint32_t);
741*e9082e47SMax Reitz     bmap_size = ROUND_UP(bmap_size, SECTOR_SIZE);
7429aebd98aSStefan Weil 
7439aebd98aSStefan Weil     memset(&header, 0, sizeof(header));
7441786dc15SBlue Swirl     pstrcpy(header.text, sizeof(header.text), VDI_TEXT);
7459aebd98aSStefan Weil     header.signature = VDI_SIGNATURE;
7469aebd98aSStefan Weil     header.version = VDI_VERSION_1_1;
7479aebd98aSStefan Weil     header.header_size = 0x180;
7489aebd98aSStefan Weil     header.image_type = image_type;
7499aebd98aSStefan Weil     header.offset_bmap = 0x200;
7509aebd98aSStefan Weil     header.offset_data = 0x200 + bmap_size;
7519aebd98aSStefan Weil     header.sector_size = SECTOR_SIZE;
7529aebd98aSStefan Weil     header.disk_size = bytes;
7539aebd98aSStefan Weil     header.block_size = block_size;
7549aebd98aSStefan Weil     header.blocks_in_image = blocks;
7556eea90ebSStefan Weil     if (image_type == VDI_TYPE_STATIC) {
7566eea90ebSStefan Weil         header.blocks_allocated = blocks;
7576eea90ebSStefan Weil     }
7589aebd98aSStefan Weil     uuid_generate(header.uuid_image);
7599aebd98aSStefan Weil     uuid_generate(header.uuid_last_snap);
7609aebd98aSStefan Weil     /* There is no need to set header.uuid_link or header.uuid_parent here. */
7619aebd98aSStefan Weil #if defined(CONFIG_VDI_DEBUG)
7629aebd98aSStefan Weil     vdi_header_print(&header);
7639aebd98aSStefan Weil #endif
7649aebd98aSStefan Weil     vdi_header_to_le(&header);
765dddc7750SJeff Cody     ret = bdrv_pwrite_sync(bs, offset, &header, sizeof(header));
766dddc7750SJeff Cody     if (ret < 0) {
76770747862SJeff Cody         error_setg(errp, "Error writing header to %s", filename);
76870747862SJeff Cody         goto exit;
7699aebd98aSStefan Weil     }
77070747862SJeff Cody     offset += sizeof(header);
7719aebd98aSStefan Weil 
772b76b6e95SStefan Weil     if (bmap_size > 0) {
77317cce735SKevin Wolf         bmap = g_try_malloc0(bmap_size);
77417cce735SKevin Wolf         if (bmap == NULL) {
77517cce735SKevin Wolf             ret = -ENOMEM;
77617cce735SKevin Wolf             error_setg(errp, "Could not allocate bmap");
77717cce735SKevin Wolf             goto exit;
77817cce735SKevin Wolf         }
7799aebd98aSStefan Weil         for (i = 0; i < blocks; i++) {
7809aebd98aSStefan Weil             if (image_type == VDI_TYPE_STATIC) {
7819aebd98aSStefan Weil                 bmap[i] = i;
7829aebd98aSStefan Weil             } else {
7839aebd98aSStefan Weil                 bmap[i] = VDI_UNALLOCATED;
7849aebd98aSStefan Weil             }
7859aebd98aSStefan Weil         }
786dddc7750SJeff Cody         ret = bdrv_pwrite_sync(bs, offset, bmap, bmap_size);
787dddc7750SJeff Cody         if (ret < 0) {
78870747862SJeff Cody             error_setg(errp, "Error writing bmap to %s", filename);
78970747862SJeff Cody             goto exit;
7909aebd98aSStefan Weil         }
79170747862SJeff Cody         offset += bmap_size;
792514f21a5SStefan Weil     }
793514f21a5SStefan Weil 
7949aebd98aSStefan Weil     if (image_type == VDI_TYPE_STATIC) {
795dddc7750SJeff Cody         ret = bdrv_truncate(bs, offset + blocks * block_size);
796dddc7750SJeff Cody         if (ret < 0) {
79770747862SJeff Cody             error_setg(errp, "Failed to statically allocate %s", filename);
79870747862SJeff Cody             goto exit;
7999aebd98aSStefan Weil         }
8009aebd98aSStefan Weil     }
8019aebd98aSStefan Weil 
80263fa06dcSJeff Cody exit:
80370747862SJeff Cody     bdrv_unref(bs);
80470747862SJeff Cody     g_free(bmap);
805dddc7750SJeff Cody     return ret;
8069aebd98aSStefan Weil }
8079aebd98aSStefan Weil 
8089aebd98aSStefan Weil static void vdi_close(BlockDriverState *bs)
8099aebd98aSStefan Weil {
810fc9d106cSKevin Wolf     BDRVVdiState *s = bs->opaque;
8116ac5f388SKevin Wolf 
81217cce735SKevin Wolf     qemu_vfree(s->bmap);
8136ac5f388SKevin Wolf 
814fc9d106cSKevin Wolf     migrate_del_blocker(s->migration_blocker);
815fc9d106cSKevin Wolf     error_free(s->migration_blocker);
8169aebd98aSStefan Weil }
8179aebd98aSStefan Weil 
818004b7f25SChunyan Liu static QemuOptsList vdi_create_opts = {
819004b7f25SChunyan Liu     .name = "vdi-create-opts",
820004b7f25SChunyan Liu     .head = QTAILQ_HEAD_INITIALIZER(vdi_create_opts.head),
821004b7f25SChunyan Liu     .desc = {
8229aebd98aSStefan Weil         {
8239aebd98aSStefan Weil             .name = BLOCK_OPT_SIZE,
824004b7f25SChunyan Liu             .type = QEMU_OPT_SIZE,
8259aebd98aSStefan Weil             .help = "Virtual disk size"
8269aebd98aSStefan Weil         },
8279aebd98aSStefan Weil #if defined(CONFIG_VDI_BLOCK_SIZE)
8289aebd98aSStefan Weil         {
8299aebd98aSStefan Weil             .name = BLOCK_OPT_CLUSTER_SIZE,
830004b7f25SChunyan Liu             .type = QEMU_OPT_SIZE,
83199cce9faSKevin Wolf             .help = "VDI cluster (block) size",
832004b7f25SChunyan Liu             .def_value_str = stringify(DEFAULT_CLUSTER_SIZE)
8339aebd98aSStefan Weil         },
8349aebd98aSStefan Weil #endif
8359aebd98aSStefan Weil #if defined(CONFIG_VDI_STATIC_IMAGE)
8369aebd98aSStefan Weil         {
8379aebd98aSStefan Weil             .name = BLOCK_OPT_STATIC,
838004b7f25SChunyan Liu             .type = QEMU_OPT_BOOL,
839004b7f25SChunyan Liu             .help = "VDI static (pre-allocated) image",
840004b7f25SChunyan Liu             .def_value_str = "off"
8419aebd98aSStefan Weil         },
8429aebd98aSStefan Weil #endif
8434ab15590SChunyan Liu         {
8444ab15590SChunyan Liu             .name = BLOCK_OPT_NOCOW,
8454ab15590SChunyan Liu             .type = QEMU_OPT_BOOL,
8464ab15590SChunyan Liu             .help = "Turn off copy-on-write (valid only on btrfs)"
8474ab15590SChunyan Liu         },
8489aebd98aSStefan Weil         /* TODO: An additional option to set UUID values might be useful. */
849004b7f25SChunyan Liu         { /* end of list */ }
850004b7f25SChunyan Liu     }
8519aebd98aSStefan Weil };
8529aebd98aSStefan Weil 
8539aebd98aSStefan Weil static BlockDriver bdrv_vdi = {
8549aebd98aSStefan Weil     .format_name = "vdi",
8559aebd98aSStefan Weil     .instance_size = sizeof(BDRVVdiState),
8569aebd98aSStefan Weil     .bdrv_probe = vdi_probe,
8579aebd98aSStefan Weil     .bdrv_open = vdi_open,
8589aebd98aSStefan Weil     .bdrv_close = vdi_close,
859ecfe2bbaSJeff Cody     .bdrv_reopen_prepare = vdi_reopen_prepare,
860c282e1fdSChunyan Liu     .bdrv_create = vdi_create,
8613ac21627SPeter Lieven     .bdrv_has_zero_init = bdrv_has_zero_init_1,
862b6b8a333SPaolo Bonzini     .bdrv_co_get_block_status = vdi_co_get_block_status,
8639aebd98aSStefan Weil     .bdrv_make_empty = vdi_make_empty,
8649aebd98aSStefan Weil 
865a7a43aa1SPaolo Bonzini     .bdrv_read = vdi_co_read,
8669aebd98aSStefan Weil #if defined(CONFIG_VDI_WRITE)
867a7a43aa1SPaolo Bonzini     .bdrv_write = vdi_co_write,
8689aebd98aSStefan Weil #endif
8699aebd98aSStefan Weil 
8709aebd98aSStefan Weil     .bdrv_get_info = vdi_get_info,
8719aebd98aSStefan Weil 
872004b7f25SChunyan Liu     .create_opts = &vdi_create_opts,
8739aebd98aSStefan Weil     .bdrv_check = vdi_check,
8749aebd98aSStefan Weil };
8759aebd98aSStefan Weil 
8769aebd98aSStefan Weil static void bdrv_vdi_init(void)
8779aebd98aSStefan Weil {
8789aebd98aSStefan Weil     logout("\n");
8799aebd98aSStefan Weil     bdrv_register(&bdrv_vdi);
8809aebd98aSStefan Weil }
8819aebd98aSStefan Weil 
8829aebd98aSStefan Weil block_init(bdrv_vdi_init);
883