xref: /qemu/qemu-nbd.c (revision b25e12da)
1cd831bd7Sths /*
27a5ca864Sbellard  *  Copyright (C) 2005  Anthony Liguori <anthony@codemonkey.ws>
37a5ca864Sbellard  *
47a5ca864Sbellard  *  Network Block Device
57a5ca864Sbellard  *
67a5ca864Sbellard  *  This program is free software; you can redistribute it and/or modify
77a5ca864Sbellard  *  it under the terms of the GNU General Public License as published by
87a5ca864Sbellard  *  the Free Software Foundation; under version 2 of the License.
97a5ca864Sbellard  *
107a5ca864Sbellard  *  This program is distributed in the hope that it will be useful,
117a5ca864Sbellard  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
127a5ca864Sbellard  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
137a5ca864Sbellard  *  GNU General Public License for more details.
147a5ca864Sbellard  *
157a5ca864Sbellard  *  You should have received a copy of the GNU General Public License
168167ee88SBlue Swirl  *  along with this program; if not, see <http://www.gnu.org/licenses/>.
177a5ca864Sbellard  */
187a5ca864Sbellard 
19d38ea87aSPeter Maydell #include "qemu/osdep.h"
20c2a3d7daSEric Blake #include <getopt.h>
21c2a3d7daSEric Blake #include <libgen.h>
22c2a3d7daSEric Blake #include <pthread.h>
23c2a3d7daSEric Blake 
24da34e65cSMarkus Armbruster #include "qapi/error.h"
25f348b6d1SVeronia Bahaa #include "qemu/cutils.h"
2626f54e9aSMarkus Armbruster #include "sysemu/block-backend.h"
27b3838a40SPeter Lieven #include "block/block_int.h"
28737e150eSPaolo Bonzini #include "block/nbd.h"
296a1751b7SAlex Bligh #include "qemu/main-loop.h"
30922a01a0SMarkus Armbruster #include "qemu/option.h"
31537b41f5SPaolo Bonzini #include "qemu/error-report.h"
320ab3b337SDaniel P. Berrange #include "qemu/config-file.h"
3358369e22SPaolo Bonzini #include "qemu/bswap.h"
3439ca463eSDenis V. Lunev #include "qemu/log.h"
3553fabd4bSPaolo Bonzini #include "qemu/systemd.h"
368c116b0eSWenchao Xia #include "block/snapshot.h"
37452fcdbcSMarkus Armbruster #include "qapi/qmp/qdict.h"
38d49b6836SMarkus Armbruster #include "qapi/qmp/qstring.h"
390ab3b337SDaniel P. Berrange #include "qom/object_interfaces.h"
40d0d6ff58SDaniel P. Berrange #include "io/channel-socket.h"
41e4849c1dSDaniel P. Berrange #include "io/net-listener.h"
42c2297088SDaniel P. Berrange #include "crypto/init.h"
4339ca463eSDenis V. Lunev #include "trace/control.h"
44be377133SEric Blake #include "qemu-version.h"
457a5ca864Sbellard 
/*
 * HAVE_NBD_DEVICE is 1 when building for Linux and 0 otherwise.  It gates
 * the code in this file that drives a local kernel NBD device.
 */
#ifdef __linux__
#define HAVE_NBD_DEVICE 1
#else
#define HAVE_NBD_DEVICE 0
#endif

/* printf-style template for the default Unix socket path (one %s). */
#define SOCKET_PATH                "/var/lock/qemu-nbd-%s"

/*
 * Numeric identifiers for options that only have a long form.
 * NOTE(review): values start at 256, i.e. above any single-character
 * option code; presumably consumed by getopt_long() in main() -- confirm.
 */
#define QEMU_NBD_OPT_CACHE         256
#define QEMU_NBD_OPT_AIO           257
#define QEMU_NBD_OPT_DISCARD       258
#define QEMU_NBD_OPT_DETECT_ZEROES 259
#define QEMU_NBD_OPT_OBJECT        260
#define QEMU_NBD_OPT_TLSCREDS      261
#define QEMU_NBD_OPT_IMAGE_OPTS    262
#define QEMU_NBD_OPT_FORK          263
#define QEMU_NBD_OPT_TLSAUTHZ      264

/* Size in bytes of the boot-record buffers read by find_partition(). */
#define MBR_SIZE 512
64bd31c214SEric Blake 
659d976580SPhilippe Mathieu-Daudé static NBDExport *export;
66b1d8e52eSblueswir1 static int verbose;
67a517e88bSPaolo Bonzini static char *srcpath;
68bd269ebcSMarkus Armbruster static SocketAddress *saddr;
697860a380SPaolo Bonzini static int persistent = 0;
707860a380SPaolo Bonzini static enum { RUNNING, TERMINATE, TERMINATING, TERMINATED } state;
71a61c6782SPaolo Bonzini static int shared = 1;
72a61c6782SPaolo Bonzini static int nb_fds;
73e4849c1dSDaniel P. Berrange static QIONetListener *server;
74145614a1SDaniel P. Berrange static QCryptoTLSCreds *tlscreds;
75*b25e12daSDaniel P. Berrange static const char *tlsauthz;
767a5ca864Sbellard 
777a5ca864Sbellard static void usage(const char *name)
787a5ca864Sbellard {
79b033cd86SPaolo Bonzini     (printf) (
807a5ca864Sbellard "Usage: %s [OPTIONS] FILE\n"
8168b96f15SEric Blake "  or:  %s -L [OPTIONS]\n"
8268b96f15SEric Blake "QEMU Disk Network Block Device Utility\n"
837a5ca864Sbellard "\n"
847a5ca864Sbellard "  -h, --help                display this help and exit\n"
857a5ca864Sbellard "  -V, --version             output version information and exit\n"
867a5ca864Sbellard "\n"
87b033cd86SPaolo Bonzini "Connection properties:\n"
88b033cd86SPaolo Bonzini "  -p, --port=PORT           port to listen on (default `%d')\n"
89b033cd86SPaolo Bonzini "  -b, --bind=IFACE          interface to bind to (default `0.0.0.0')\n"
90b033cd86SPaolo Bonzini "  -k, --socket=PATH         path to the unix socket\n"
91b033cd86SPaolo Bonzini "                            (default '"SOCKET_PATH"')\n"
92b033cd86SPaolo Bonzini "  -e, --shared=NUM          device can be shared by NUM clients (default '1')\n"
93b033cd86SPaolo Bonzini "  -t, --persistent          don't exit on the last connection\n"
94b033cd86SPaolo Bonzini "  -v, --verbose             display extra debugging information\n"
95f5cd0bb5SVladimir Sementsov-Ogievskiy "  -x, --export-name=NAME    expose export by name (default is empty string)\n"
96f5cd0bb5SVladimir Sementsov-Ogievskiy "  -D, --description=TEXT    export a human-readable description\n"
97b033cd86SPaolo Bonzini "\n"
98b033cd86SPaolo Bonzini "Exposing part of the image:\n"
99b033cd86SPaolo Bonzini "  -o, --offset=OFFSET       offset into the image\n"
100b033cd86SPaolo Bonzini "  -P, --partition=NUM       only expose partition NUM\n"
101636192c4SEric Blake "  -B, --bitmap=NAME         expose a persistent dirty bitmap\n"
102b033cd86SPaolo Bonzini "\n"
1030ab3b337SDaniel P. Berrange "General purpose options:\n"
10468b96f15SEric Blake "  -L, --list                list exports available from another NBD server\n"
1050ab3b337SDaniel P. Berrange "  --object type,id=ID,...   define an object such as 'secret' for providing\n"
1060ab3b337SDaniel P. Berrange "                            passwords and/or encryption keys\n"
107f7812df7SEric Blake "  --tls-creds=ID            use id of an earlier --object to provide TLS\n"
108*b25e12daSDaniel P. Berrange "  --tls-authz=ID            use id of an earlier --object to provide\n"
109*b25e12daSDaniel P. Berrange "                            authorization\n"
11039ca463eSDenis V. Lunev "  -T, --trace [[enable=]<pattern>][,events=<file>][,file=<file>]\n"
11139ca463eSDenis V. Lunev "                            specify tracing options\n"
112ffb31e1dSMax Reitz "  --fork                    fork off the server process and exit the parent\n"
113ffb31e1dSMax Reitz "                            once the server is running\n"
1143c1fa35dSEric Blake #if HAVE_NBD_DEVICE
1153c1fa35dSEric Blake "\n"
116b033cd86SPaolo Bonzini "Kernel NBD client support:\n"
117b033cd86SPaolo Bonzini "  -c, --connect=DEV         connect FILE to the local NBD device DEV\n"
118b033cd86SPaolo Bonzini "  -d, --disconnect          disconnect the specified device\n"
119b033cd86SPaolo Bonzini #endif
120b033cd86SPaolo Bonzini "\n"
121b033cd86SPaolo Bonzini "Block device options:\n"
1224323fdcfSWenchao Xia "  -f, --format=FORMAT       set image format (raw, qcow2, ...)\n"
123b033cd86SPaolo Bonzini "  -r, --read-only           export read-only\n"
1248c116b0eSWenchao Xia "  -s, --snapshot            use FILE as an external snapshot, create a temporary\n"
1258c116b0eSWenchao Xia "                            file with backing_file=FILE, redirect the write to\n"
1268c116b0eSWenchao Xia "                            the temporary one\n"
1278c116b0eSWenchao Xia "  -l, --load-snapshot=SNAPSHOT_PARAM\n"
1288c116b0eSWenchao Xia "                            load an internal snapshot inside FILE and export it\n"
1298c116b0eSWenchao Xia "                            as an read-only device, SNAPSHOT_PARAM format is\n"
1308c116b0eSWenchao Xia "                            'snapshot.id=[ID],snapshot.name=[NAME]', or\n"
1318c116b0eSWenchao Xia "                            '[ID_OR_NAME]'\n"
132b033cd86SPaolo Bonzini "  -n, --nocache             disable host cache\n"
13339a5235cSPaolo Bonzini "      --cache=MODE          set cache mode (none, writeback, ...)\n"
13439a5235cSPaolo Bonzini "      --aio=MODE            set AIO mode (native or threads)\n"
135b3838a40SPeter Lieven "      --discard=MODE        set discard mode (ignore, unmap)\n"
1366883de6cSAndrey Korolyov "      --detect-zeroes=MODE  set detect-zeroes mode (off, on, unmap)\n"
13777c9aaefSDaniel P. Berrange "      --image-opts          treat FILE as a full set of image options\n"
138b033cd86SPaolo Bonzini "\n"
139f5048cb7SEric Blake QEMU_HELP_BOTTOM "\n"
14068b96f15SEric Blake     , name, name, NBD_DEFAULT_PORT, "DEVICE");
1417a5ca864Sbellard }
1427a5ca864Sbellard 
1437a5ca864Sbellard static void version(const char *name)
1447a5ca864Sbellard {
1457a5ca864Sbellard     printf(
1467e563bfbSThomas Huth "%s " QEMU_FULL_VERSION "\n"
1477a5ca864Sbellard "Written by Anthony Liguori.\n"
1487a5ca864Sbellard "\n"
149be377133SEric Blake QEMU_COPYRIGHT "\n"
1507a5ca864Sbellard "This is free software; see the source for copying conditions.  There is NO\n"
1517a5ca864Sbellard "warranty; not even for MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.\n"
152315bc7aaSths     , name);
1537a5ca864Sbellard }
1547a5ca864Sbellard 
/*
 * Decoded form of one 16-byte partition table entry, as filled in by
 * read_partition().
 *
 * Both cylinder fields receive a value assembled from one full byte plus
 * two extra high bits (up to 0x3ff), so neither may be narrower than
 * 10 bits.  end_cylinder is therefore as wide as start_cylinder.
 */
struct partition_record
{
    uint8_t bootable;
    uint8_t start_head;
    uint32_t start_cylinder;
    uint8_t start_sector;
    uint8_t system;
    uint8_t end_head;
    uint32_t end_cylinder;      /* widened: a uint8_t dropped bits 8-9 */
    uint8_t end_sector;
    uint32_t start_sector_abs;  /* first sector, in 512-byte units */
    uint32_t nb_sectors_abs;    /* length, in 512-byte units */
};
1687a5ca864Sbellard 
1697a5ca864Sbellard static void read_partition(uint8_t *p, struct partition_record *r)
1707a5ca864Sbellard {
1717a5ca864Sbellard     r->bootable = p[0];
1727a5ca864Sbellard     r->start_head = p[1];
1737a5ca864Sbellard     r->start_cylinder = p[3] | ((p[2] << 2) & 0x0300);
1747a5ca864Sbellard     r->start_sector = p[2] & 0x3f;
1757a5ca864Sbellard     r->system = p[4];
1767a5ca864Sbellard     r->end_head = p[5];
1777a5ca864Sbellard     r->end_cylinder = p[7] | ((p[6] << 2) & 0x300);
1787a5ca864Sbellard     r->end_sector = p[6] & 0x3f;
179ac97393dSMax Reitz 
180773dce3cSPeter Maydell     r->start_sector_abs = ldl_le_p(p + 8);
181773dce3cSPeter Maydell     r->nb_sectors_abs   = ldl_le_p(p + 12);
1827a5ca864Sbellard }
1837a5ca864Sbellard 
1844c58e80aSMax Reitz static int find_partition(BlockBackend *blk, int partition,
1859d26dfcbSEric Blake                           uint64_t *offset, uint64_t *size)
1867a5ca864Sbellard {
1877a5ca864Sbellard     struct partition_record mbr[4];
188bd31c214SEric Blake     uint8_t data[MBR_SIZE];
1897a5ca864Sbellard     int i;
1907a5ca864Sbellard     int ext_partnum = 4;
191cb7cf0e3SRyota Ozaki     int ret;
1927a5ca864Sbellard 
193bd31c214SEric Blake     ret = blk_pread(blk, 0, data, sizeof(data));
194bd31c214SEric Blake     if (ret < 0) {
195a4699e55SMarkus Armbruster         error_report("error while reading: %s", strerror(-ret));
19685b01e09SMarkus Armbruster         exit(EXIT_FAILURE);
197cb7cf0e3SRyota Ozaki     }
1987a5ca864Sbellard 
1997a5ca864Sbellard     if (data[510] != 0x55 || data[511] != 0xaa) {
200185b4338SPaolo Bonzini         return -EINVAL;
2017a5ca864Sbellard     }
2027a5ca864Sbellard 
2037a5ca864Sbellard     for (i = 0; i < 4; i++) {
2047a5ca864Sbellard         read_partition(&data[446 + 16 * i], &mbr[i]);
2057a5ca864Sbellard 
206453b07b1SMax Reitz         if (!mbr[i].system || !mbr[i].nb_sectors_abs) {
2077a5ca864Sbellard             continue;
208453b07b1SMax Reitz         }
2097a5ca864Sbellard 
2107a5ca864Sbellard         if (mbr[i].system == 0xF || mbr[i].system == 0x5) {
2117a5ca864Sbellard             struct partition_record ext[4];
212bd31c214SEric Blake             uint8_t data1[MBR_SIZE];
2137a5ca864Sbellard             int j;
2147a5ca864Sbellard 
215bd31c214SEric Blake             ret = blk_pread(blk, mbr[i].start_sector_abs * MBR_SIZE,
216bd31c214SEric Blake                             data1, sizeof(data1));
217bd31c214SEric Blake             if (ret < 0) {
218a4699e55SMarkus Armbruster                 error_report("error while reading: %s", strerror(-ret));
21985b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
220cb7cf0e3SRyota Ozaki             }
2217a5ca864Sbellard 
2227a5ca864Sbellard             for (j = 0; j < 4; j++) {
2237a5ca864Sbellard                 read_partition(&data1[446 + 16 * j], &ext[j]);
224453b07b1SMax Reitz                 if (!ext[j].system || !ext[j].nb_sectors_abs) {
2257a5ca864Sbellard                     continue;
226453b07b1SMax Reitz                 }
2277a5ca864Sbellard 
2287a5ca864Sbellard                 if ((ext_partnum + j + 1) == partition) {
2297a5ca864Sbellard                     *offset = (uint64_t)ext[j].start_sector_abs << 9;
2307a5ca864Sbellard                     *size = (uint64_t)ext[j].nb_sectors_abs << 9;
2317a5ca864Sbellard                     return 0;
2327a5ca864Sbellard                 }
2337a5ca864Sbellard             }
2347a5ca864Sbellard             ext_partnum += 4;
2357a5ca864Sbellard         } else if ((i + 1) == partition) {
2367a5ca864Sbellard             *offset = (uint64_t)mbr[i].start_sector_abs << 9;
2377a5ca864Sbellard             *size = (uint64_t)mbr[i].nb_sectors_abs << 9;
2387a5ca864Sbellard             return 0;
2397a5ca864Sbellard         }
2407a5ca864Sbellard     }
2417a5ca864Sbellard 
242185b4338SPaolo Bonzini     return -ENOENT;
2437a5ca864Sbellard }
2447a5ca864Sbellard 
245bb345110SPaolo Bonzini static void termsig_handler(int signum)
246bb345110SPaolo Bonzini {
24723994a5fSPavel Butsykin     atomic_cmpxchg(&state, RUNNING, TERMINATE);
248a61c6782SPaolo Bonzini     qemu_notify_event();
249bb345110SPaolo Bonzini }
250bb345110SPaolo Bonzini 
251537b41f5SPaolo Bonzini 
25268b96f15SEric Blake static int qemu_nbd_client_list(SocketAddress *saddr, QCryptoTLSCreds *tls,
25368b96f15SEric Blake                                 const char *hostname)
25468b96f15SEric Blake {
25568b96f15SEric Blake     int ret = EXIT_FAILURE;
25668b96f15SEric Blake     int rc;
25768b96f15SEric Blake     Error *err = NULL;
25868b96f15SEric Blake     QIOChannelSocket *sioc;
25968b96f15SEric Blake     NBDExportInfo *list;
26068b96f15SEric Blake     int i, j;
26168b96f15SEric Blake 
26268b96f15SEric Blake     sioc = qio_channel_socket_new();
26368b96f15SEric Blake     if (qio_channel_socket_connect_sync(sioc, saddr, &err) < 0) {
26468b96f15SEric Blake         error_report_err(err);
26568b96f15SEric Blake         return EXIT_FAILURE;
26668b96f15SEric Blake     }
26768b96f15SEric Blake     rc = nbd_receive_export_list(QIO_CHANNEL(sioc), tls, hostname, &list,
26868b96f15SEric Blake                                  &err);
26968b96f15SEric Blake     if (rc < 0) {
27068b96f15SEric Blake         if (err) {
27168b96f15SEric Blake             error_report_err(err);
27268b96f15SEric Blake         }
27368b96f15SEric Blake         goto out;
27468b96f15SEric Blake     }
27568b96f15SEric Blake     printf("exports available: %d\n", rc);
27668b96f15SEric Blake     for (i = 0; i < rc; i++) {
27768b96f15SEric Blake         printf(" export: '%s'\n", list[i].name);
27868b96f15SEric Blake         if (list[i].description && *list[i].description) {
27968b96f15SEric Blake             printf("  description: %s\n", list[i].description);
28068b96f15SEric Blake         }
28168b96f15SEric Blake         if (list[i].flags & NBD_FLAG_HAS_FLAGS) {
28268b96f15SEric Blake             printf("  size:  %" PRIu64 "\n", list[i].size);
28368b96f15SEric Blake             printf("  flags: 0x%x (", list[i].flags);
28468b96f15SEric Blake             if (list[i].flags & NBD_FLAG_READ_ONLY) {
28568b96f15SEric Blake                 printf(" readonly");
28668b96f15SEric Blake             }
28768b96f15SEric Blake             if (list[i].flags & NBD_FLAG_SEND_FLUSH) {
28868b96f15SEric Blake                 printf(" flush");
28968b96f15SEric Blake             }
29068b96f15SEric Blake             if (list[i].flags & NBD_FLAG_SEND_FUA) {
29168b96f15SEric Blake                 printf(" fua");
29268b96f15SEric Blake             }
29368b96f15SEric Blake             if (list[i].flags & NBD_FLAG_ROTATIONAL) {
29468b96f15SEric Blake                 printf(" rotational");
29568b96f15SEric Blake             }
29668b96f15SEric Blake             if (list[i].flags & NBD_FLAG_SEND_TRIM) {
29768b96f15SEric Blake                 printf(" trim");
29868b96f15SEric Blake             }
29968b96f15SEric Blake             if (list[i].flags & NBD_FLAG_SEND_WRITE_ZEROES) {
30068b96f15SEric Blake                 printf(" zeroes");
30168b96f15SEric Blake             }
30268b96f15SEric Blake             if (list[i].flags & NBD_FLAG_SEND_DF) {
30368b96f15SEric Blake                 printf(" df");
30468b96f15SEric Blake             }
30568b96f15SEric Blake             if (list[i].flags & NBD_FLAG_CAN_MULTI_CONN) {
30668b96f15SEric Blake                 printf(" multi");
30768b96f15SEric Blake             }
30868b96f15SEric Blake             if (list[i].flags & NBD_FLAG_SEND_RESIZE) {
30968b96f15SEric Blake                 printf(" resize");
31068b96f15SEric Blake             }
31168b96f15SEric Blake             if (list[i].flags & NBD_FLAG_SEND_CACHE) {
31268b96f15SEric Blake                 printf(" cache");
31368b96f15SEric Blake             }
31468b96f15SEric Blake             printf(" )\n");
31568b96f15SEric Blake         }
31668b96f15SEric Blake         if (list[i].min_block) {
31768b96f15SEric Blake             printf("  min block: %u\n", list[i].min_block);
31868b96f15SEric Blake             printf("  opt block: %u\n", list[i].opt_block);
31968b96f15SEric Blake             printf("  max block: %u\n", list[i].max_block);
32068b96f15SEric Blake         }
32168b96f15SEric Blake         if (list[i].n_contexts) {
32268b96f15SEric Blake             printf("  available meta contexts: %d\n", list[i].n_contexts);
32368b96f15SEric Blake             for (j = 0; j < list[i].n_contexts; j++) {
32468b96f15SEric Blake                 printf("   %s\n", list[i].contexts[j]);
32568b96f15SEric Blake             }
32668b96f15SEric Blake         }
32768b96f15SEric Blake     }
32868b96f15SEric Blake     nbd_free_export_list(list, rc);
32968b96f15SEric Blake 
33068b96f15SEric Blake     ret = EXIT_SUCCESS;
33168b96f15SEric Blake  out:
33268b96f15SEric Blake     object_unref(OBJECT(sioc));
33368b96f15SEric Blake     return ret;
33468b96f15SEric Blake }
33568b96f15SEric Blake 
33668b96f15SEric Blake 
3373c1fa35dSEric Blake #if HAVE_NBD_DEVICE
/*
 * Thread entry point: open the device node named by @arg read-write and
 * close it again straight away.  Always returns NULL; a failed open is
 * ignored.
 */
static void *show_parts(void *arg)
{
    const char *path = arg;
    int fd;

    /*
     * On Linux a plain open() is enough to trigger the partition table
     * update, but the nbd module must have been loaded with a non-zero
     * max_part, e.g.:
     *     modprobe nbd max_part=63
     */
    fd = open(path, O_RDWR);
    if (fd < 0) {
        return NULL;
    }

    close(fd);
    return NULL;
}
354a517e88bSPaolo Bonzini 
355a517e88bSPaolo Bonzini static void *nbd_client_thread(void *arg)
356a517e88bSPaolo Bonzini {
357a6ac2313SPaolo Bonzini     char *device = arg;
3586dc1667dSEric Blake     NBDExportInfo info = { .request_sizes = false, .name = g_strdup("") };
359d0d6ff58SDaniel P. Berrange     QIOChannelSocket *sioc;
360d0d6ff58SDaniel P. Berrange     int fd;
361a517e88bSPaolo Bonzini     int ret;
362a517e88bSPaolo Bonzini     pthread_t show_parts_thread;
3631ce52846SMax Reitz     Error *local_error = NULL;
364a517e88bSPaolo Bonzini 
365d0d6ff58SDaniel P. Berrange     sioc = qio_channel_socket_new();
366d0d6ff58SDaniel P. Berrange     if (qio_channel_socket_connect_sync(sioc,
367d0d6ff58SDaniel P. Berrange                                         saddr,
368d0d6ff58SDaniel P. Berrange                                         &local_error) < 0) {
36948bec07eSDaniel P. Berrange         error_report_err(local_error);
370a517e88bSPaolo Bonzini         goto out;
371a517e88bSPaolo Bonzini     }
372a517e88bSPaolo Bonzini 
3736dc1667dSEric Blake     ret = nbd_receive_negotiate(QIO_CHANNEL(sioc),
374004a89fcSEric Blake                                 NULL, NULL, NULL, &info, &local_error);
375fc19f8a0SPaolo Bonzini     if (ret < 0) {
3761ce52846SMax Reitz         if (local_error) {
37778288671SMarkus Armbruster             error_report_err(local_error);
3781ce52846SMax Reitz         }
3790c544d73SPaolo Bonzini         goto out_socket;
380a517e88bSPaolo Bonzini     }
381a517e88bSPaolo Bonzini 
382a6ac2313SPaolo Bonzini     fd = open(device, O_RDWR);
383fc19f8a0SPaolo Bonzini     if (fd < 0) {
384a6ac2313SPaolo Bonzini         /* Linux-only, we can use %m in printf.  */
385b9884681SMarkus Armbruster         error_report("Failed to open %s: %m", device);
3860c544d73SPaolo Bonzini         goto out_socket;
387a6ac2313SPaolo Bonzini     }
388a6ac2313SPaolo Bonzini 
389004a89fcSEric Blake     ret = nbd_init(fd, sioc, &info, &local_error);
390fc19f8a0SPaolo Bonzini     if (ret < 0) {
391be41c100SVladimir Sementsov-Ogievskiy         error_report_err(local_error);
3920c544d73SPaolo Bonzini         goto out_fd;
393a517e88bSPaolo Bonzini     }
394a517e88bSPaolo Bonzini 
395a517e88bSPaolo Bonzini     /* update partition table */
396a6ac2313SPaolo Bonzini     pthread_create(&show_parts_thread, NULL, show_parts, device);
397a517e88bSPaolo Bonzini 
398c1f8fdc3SPaolo Bonzini     if (verbose) {
399a517e88bSPaolo Bonzini         fprintf(stderr, "NBD device %s is now connected to %s\n",
400a517e88bSPaolo Bonzini                 device, srcpath);
401c1f8fdc3SPaolo Bonzini     } else {
402c1f8fdc3SPaolo Bonzini         /* Close stderr so that the qemu-nbd process exits.  */
403c1f8fdc3SPaolo Bonzini         dup2(STDOUT_FILENO, STDERR_FILENO);
404c1f8fdc3SPaolo Bonzini     }
405a517e88bSPaolo Bonzini 
406a517e88bSPaolo Bonzini     ret = nbd_client(fd);
407a517e88bSPaolo Bonzini     if (ret) {
4080c544d73SPaolo Bonzini         goto out_fd;
409a517e88bSPaolo Bonzini     }
410a517e88bSPaolo Bonzini     close(fd);
411d0d6ff58SDaniel P. Berrange     object_unref(OBJECT(sioc));
4126dc1667dSEric Blake     g_free(info.name);
413a517e88bSPaolo Bonzini     kill(getpid(), SIGTERM);
414a517e88bSPaolo Bonzini     return (void *) EXIT_SUCCESS;
415a517e88bSPaolo Bonzini 
4160c544d73SPaolo Bonzini out_fd:
4170c544d73SPaolo Bonzini     close(fd);
4180c544d73SPaolo Bonzini out_socket:
419d0d6ff58SDaniel P. Berrange     object_unref(OBJECT(sioc));
420a517e88bSPaolo Bonzini out:
4216dc1667dSEric Blake     g_free(info.name);
422a517e88bSPaolo Bonzini     kill(getpid(), SIGTERM);
423a517e88bSPaolo Bonzini     return (void *) EXIT_FAILURE;
424cd831bd7Sths }
4253c1fa35dSEric Blake #endif /* HAVE_NBD_DEVICE */
426cd831bd7Sths 
427e4afbf4fSFam Zheng static int nbd_can_accept(void)
428a61c6782SPaolo Bonzini {
429df8ad9f1SEric Blake     return state == RUNNING && nb_fds < shared;
430a61c6782SPaolo Bonzini }
431a61c6782SPaolo Bonzini 
4329d976580SPhilippe Mathieu-Daudé static void nbd_export_closed(NBDExport *export)
4337860a380SPaolo Bonzini {
4347860a380SPaolo Bonzini     assert(state == TERMINATING);
4357860a380SPaolo Bonzini     state = TERMINATED;
4367860a380SPaolo Bonzini }
4377860a380SPaolo Bonzini 
438d0d6ff58SDaniel P. Berrange static void nbd_update_server_watch(void);
439e4afbf4fSFam Zheng 
4400c9390d9SEric Blake static void nbd_client_closed(NBDClient *client, bool negotiated)
441a61c6782SPaolo Bonzini {
442a61c6782SPaolo Bonzini     nb_fds--;
4430c9390d9SEric Blake     if (negotiated && nb_fds == 0 && !persistent && state == RUNNING) {
4447860a380SPaolo Bonzini         state = TERMINATE;
4457860a380SPaolo Bonzini     }
446d0d6ff58SDaniel P. Berrange     nbd_update_server_watch();
4477860a380SPaolo Bonzini     nbd_client_put(client);
448a61c6782SPaolo Bonzini }
449a61c6782SPaolo Bonzini 
450e4849c1dSDaniel P. Berrange static void nbd_accept(QIONetListener *listener, QIOChannelSocket *cioc,
451e4849c1dSDaniel P. Berrange                        gpointer opaque)
452a61c6782SPaolo Bonzini {
4537860a380SPaolo Bonzini     if (state >= TERMINATE) {
454e4849c1dSDaniel P. Berrange         return;
4557860a380SPaolo Bonzini     }
4567860a380SPaolo Bonzini 
457a61c6782SPaolo Bonzini     nb_fds++;
458d0d6ff58SDaniel P. Berrange     nbd_update_server_watch();
459*b25e12daSDaniel P. Berrange     nbd_client_new(cioc, tlscreds, tlsauthz, nbd_client_closed);
460d0d6ff58SDaniel P. Berrange }
461d0d6ff58SDaniel P. Berrange 
462d0d6ff58SDaniel P. Berrange static void nbd_update_server_watch(void)
463e4afbf4fSFam Zheng {
464e4afbf4fSFam Zheng     if (nbd_can_accept()) {
465e4849c1dSDaniel P. Berrange         qio_net_listener_set_client_func(server, nbd_accept, NULL, NULL);
466e4afbf4fSFam Zheng     } else {
467e4849c1dSDaniel P. Berrange         qio_net_listener_set_client_func(server, NULL, NULL, NULL);
468e4afbf4fSFam Zheng     }
469e4afbf4fSFam Zheng }
470e4afbf4fSFam Zheng 
47148bec07eSDaniel P. Berrange 
472bd269ebcSMarkus Armbruster static SocketAddress *nbd_build_socket_address(const char *sockpath,
47348bec07eSDaniel P. Berrange                                                const char *bindto,
47448bec07eSDaniel P. Berrange                                                const char *port)
47548bec07eSDaniel P. Berrange {
476bd269ebcSMarkus Armbruster     SocketAddress *saddr;
47748bec07eSDaniel P. Berrange 
478bd269ebcSMarkus Armbruster     saddr = g_new0(SocketAddress, 1);
47948bec07eSDaniel P. Berrange     if (sockpath) {
480bd269ebcSMarkus Armbruster         saddr->type = SOCKET_ADDRESS_TYPE_UNIX;
481bd269ebcSMarkus Armbruster         saddr->u.q_unix.path = g_strdup(sockpath);
48248bec07eSDaniel P. Berrange     } else {
4830399293eSEric Blake         InetSocketAddress *inet;
484bd269ebcSMarkus Armbruster         saddr->type = SOCKET_ADDRESS_TYPE_INET;
485bd269ebcSMarkus Armbruster         inet = &saddr->u.inet;
4860399293eSEric Blake         inet->host = g_strdup(bindto);
48748bec07eSDaniel P. Berrange         if (port) {
4880399293eSEric Blake             inet->port = g_strdup(port);
48948bec07eSDaniel P. Berrange         } else  {
4900399293eSEric Blake             inet->port = g_strdup_printf("%d", NBD_DEFAULT_PORT);
49148bec07eSDaniel P. Berrange         }
49248bec07eSDaniel P. Berrange     }
49348bec07eSDaniel P. Berrange 
49448bec07eSDaniel P. Berrange     return saddr;
49548bec07eSDaniel P. Berrange }
49648bec07eSDaniel P. Berrange 
49748bec07eSDaniel P. Berrange 
49877c9aaefSDaniel P. Berrange static QemuOptsList file_opts = {
49977c9aaefSDaniel P. Berrange     .name = "file",
50077c9aaefSDaniel P. Berrange     .implied_opt_name = "file",
50177c9aaefSDaniel P. Berrange     .head = QTAILQ_HEAD_INITIALIZER(file_opts.head),
50277c9aaefSDaniel P. Berrange     .desc = {
50377c9aaefSDaniel P. Berrange         /* no elements => accept any params */
50477c9aaefSDaniel P. Berrange         { /* end of list */ }
50577c9aaefSDaniel P. Berrange     },
50677c9aaefSDaniel P. Berrange };
50777c9aaefSDaniel P. Berrange 
5080ab3b337SDaniel P. Berrange static QemuOptsList qemu_object_opts = {
5090ab3b337SDaniel P. Berrange     .name = "object",
5100ab3b337SDaniel P. Berrange     .implied_opt_name = "qom-type",
5110ab3b337SDaniel P. Berrange     .head = QTAILQ_HEAD_INITIALIZER(qemu_object_opts.head),
5120ab3b337SDaniel P. Berrange     .desc = {
5130ab3b337SDaniel P. Berrange         { }
5140ab3b337SDaniel P. Berrange     },
5150ab3b337SDaniel P. Berrange };
5160ab3b337SDaniel P. Berrange 
5170ab3b337SDaniel P. Berrange 
518145614a1SDaniel P. Berrange 
51968b96f15SEric Blake static QCryptoTLSCreds *nbd_get_tls_creds(const char *id, bool list,
52068b96f15SEric Blake                                           Error **errp)
521145614a1SDaniel P. Berrange {
522145614a1SDaniel P. Berrange     Object *obj;
523145614a1SDaniel P. Berrange     QCryptoTLSCreds *creds;
524145614a1SDaniel P. Berrange 
525145614a1SDaniel P. Berrange     obj = object_resolve_path_component(
526145614a1SDaniel P. Berrange         object_get_objects_root(), id);
527145614a1SDaniel P. Berrange     if (!obj) {
528145614a1SDaniel P. Berrange         error_setg(errp, "No TLS credentials with id '%s'",
529145614a1SDaniel P. Berrange                    id);
530145614a1SDaniel P. Berrange         return NULL;
531145614a1SDaniel P. Berrange     }
532145614a1SDaniel P. Berrange     creds = (QCryptoTLSCreds *)
533145614a1SDaniel P. Berrange         object_dynamic_cast(obj, TYPE_QCRYPTO_TLS_CREDS);
534145614a1SDaniel P. Berrange     if (!creds) {
535145614a1SDaniel P. Berrange         error_setg(errp, "Object with id '%s' is not TLS credentials",
536145614a1SDaniel P. Berrange                    id);
537145614a1SDaniel P. Berrange         return NULL;
538145614a1SDaniel P. Berrange     }
539145614a1SDaniel P. Berrange 
54068b96f15SEric Blake     if (list) {
54168b96f15SEric Blake         if (creds->endpoint != QCRYPTO_TLS_CREDS_ENDPOINT_CLIENT) {
54268b96f15SEric Blake             error_setg(errp,
54368b96f15SEric Blake                        "Expecting TLS credentials with a client endpoint");
54468b96f15SEric Blake             return NULL;
54568b96f15SEric Blake         }
54668b96f15SEric Blake     } else {
547145614a1SDaniel P. Berrange         if (creds->endpoint != QCRYPTO_TLS_CREDS_ENDPOINT_SERVER) {
548145614a1SDaniel P. Berrange             error_setg(errp,
549145614a1SDaniel P. Berrange                        "Expecting TLS credentials with a server endpoint");
550145614a1SDaniel P. Berrange             return NULL;
551145614a1SDaniel P. Berrange         }
55268b96f15SEric Blake     }
553145614a1SDaniel P. Berrange     object_ref(obj);
554145614a1SDaniel P. Berrange     return creds;
555145614a1SDaniel P. Berrange }
556145614a1SDaniel P. Berrange 
557a721f53bSRichard W.M. Jones static void setup_address_and_port(const char **address, const char **port)
558a721f53bSRichard W.M. Jones {
559a721f53bSRichard W.M. Jones     if (*address == NULL) {
560a721f53bSRichard W.M. Jones         *address = "0.0.0.0";
561a721f53bSRichard W.M. Jones     }
562a721f53bSRichard W.M. Jones 
563a721f53bSRichard W.M. Jones     if (*port == NULL) {
564a721f53bSRichard W.M. Jones         *port = stringify(NBD_DEFAULT_PORT);
565a721f53bSRichard W.M. Jones     }
566a721f53bSRichard W.M. Jones }
567a721f53bSRichard W.M. Jones 
/*
 * Check that no option incompatible with socket activation was given.
 *
 * The checks run in a fixed order (device, Unix socket path, bind address,
 * port, list mode) and the message for the first offending option is
 * returned.
 *
 * Returns: a static error message, or NULL if the options are compatible.
 */
static const char *socket_activation_validate_opts(const char *device,
                                                   const char *sockpath,
                                                   const char *address,
                                                   const char *port,
                                                   bool list)
{
    if (device) {
        return "NBD device can't be set when using socket activation";
    }
    if (sockpath) {
        return "Unix socket can't be set when using socket activation";
    }
    if (address) {
        return "The interface can't be set when using socket activation";
    }
    if (port) {
        return "TCP port number can't be set when using socket activation";
    }
    if (list) {
        return "List mode is incompatible with socket activation";
    }

    return NULL;
}
599145614a1SDaniel P. Berrange 
600b3b5299dSKevin Wolf static void qemu_nbd_shutdown(void)
601b3b5299dSKevin Wolf {
602b3b5299dSKevin Wolf     job_cancel_sync_all();
603b3b5299dSKevin Wolf     bdrv_close_all();
604b3b5299dSKevin Wolf }
605b3b5299dSKevin Wolf 
6067a5ca864Sbellard int main(int argc, char **argv)
6077a5ca864Sbellard {
60826f54e9aSMarkus Armbruster     BlockBackend *blk;
6097a5ca864Sbellard     BlockDriverState *bs;
6109d26dfcbSEric Blake     uint64_t dev_offset = 0;
6117423f417SEric Blake     uint16_t nbdflags = 0;
612cd831bd7Sths     bool disconnect = false;
613a721f53bSRichard W.M. Jones     const char *bindto = NULL;
61448bec07eSDaniel P. Berrange     const char *port = NULL;
61548bec07eSDaniel P. Berrange     char *sockpath = NULL;
616a6ac2313SPaolo Bonzini     char *device = NULL;
6179d26dfcbSEric Blake     int64_t fd_size;
6188c116b0eSWenchao Xia     QemuOpts *sn_opts = NULL;
6198c116b0eSWenchao Xia     const char *sn_id_or_name = NULL;
62068b96f15SEric Blake     const char *sopt = "hVb:o:p:rsnP:c:dvk:e:f:tl:x:T:D:B:L";
6217a5ca864Sbellard     struct option lopt[] = {
622aa6e546cSDaniel P. Berrange         { "help", no_argument, NULL, 'h' },
623aa6e546cSDaniel P. Berrange         { "version", no_argument, NULL, 'V' },
624aa6e546cSDaniel P. Berrange         { "bind", required_argument, NULL, 'b' },
625aa6e546cSDaniel P. Berrange         { "port", required_argument, NULL, 'p' },
626aa6e546cSDaniel P. Berrange         { "socket", required_argument, NULL, 'k' },
627aa6e546cSDaniel P. Berrange         { "offset", required_argument, NULL, 'o' },
628aa6e546cSDaniel P. Berrange         { "read-only", no_argument, NULL, 'r' },
629aa6e546cSDaniel P. Berrange         { "partition", required_argument, NULL, 'P' },
630636192c4SEric Blake         { "bitmap", required_argument, NULL, 'B' },
631aa6e546cSDaniel P. Berrange         { "connect", required_argument, NULL, 'c' },
632aa6e546cSDaniel P. Berrange         { "disconnect", no_argument, NULL, 'd' },
63368b96f15SEric Blake         { "list", no_argument, NULL, 'L' },
634aa6e546cSDaniel P. Berrange         { "snapshot", no_argument, NULL, 's' },
635aa6e546cSDaniel P. Berrange         { "load-snapshot", required_argument, NULL, 'l' },
636aa6e546cSDaniel P. Berrange         { "nocache", no_argument, NULL, 'n' },
637aa6e546cSDaniel P. Berrange         { "cache", required_argument, NULL, QEMU_NBD_OPT_CACHE },
638aa6e546cSDaniel P. Berrange         { "aio", required_argument, NULL, QEMU_NBD_OPT_AIO },
639aa6e546cSDaniel P. Berrange         { "discard", required_argument, NULL, QEMU_NBD_OPT_DISCARD },
640aa6e546cSDaniel P. Berrange         { "detect-zeroes", required_argument, NULL,
641aa6e546cSDaniel P. Berrange           QEMU_NBD_OPT_DETECT_ZEROES },
642aa6e546cSDaniel P. Berrange         { "shared", required_argument, NULL, 'e' },
643aa6e546cSDaniel P. Berrange         { "format", required_argument, NULL, 'f' },
644aa6e546cSDaniel P. Berrange         { "persistent", no_argument, NULL, 't' },
645aa6e546cSDaniel P. Berrange         { "verbose", no_argument, NULL, 'v' },
646aa6e546cSDaniel P. Berrange         { "object", required_argument, NULL, QEMU_NBD_OPT_OBJECT },
647aa6e546cSDaniel P. Berrange         { "export-name", required_argument, NULL, 'x' },
648b1a75b33SEric Blake         { "description", required_argument, NULL, 'D' },
649aa6e546cSDaniel P. Berrange         { "tls-creds", required_argument, NULL, QEMU_NBD_OPT_TLSCREDS },
650*b25e12daSDaniel P. Berrange         { "tls-authz", required_argument, NULL, QEMU_NBD_OPT_TLSAUTHZ },
651aa6e546cSDaniel P. Berrange         { "image-opts", no_argument, NULL, QEMU_NBD_OPT_IMAGE_OPTS },
65239ca463eSDenis V. Lunev         { "trace", required_argument, NULL, 'T' },
653ffb31e1dSMax Reitz         { "fork", no_argument, NULL, QEMU_NBD_OPT_FORK },
654660f11beSBlue Swirl         { NULL, 0, NULL, 0 }
6557a5ca864Sbellard     };
6567a5ca864Sbellard     int ch;
6577a5ca864Sbellard     int opt_ind = 0;
658f5edb014SNaphtali Sprei     int flags = BDRV_O_RDWR;
65943b51011SEric Blake     int partition = 0;
6604fbec260SMax Reitz     int ret = 0;
66139a5235cSPaolo Bonzini     bool seen_cache = false;
662ded9d2d5SPaolo Bonzini     bool seen_discard = false;
66339a5235cSPaolo Bonzini     bool seen_aio = false;
664a517e88bSPaolo Bonzini     pthread_t client_thread;
665e6b63677SDaniel P. Berrange     const char *fmt = NULL;
66634b5d2c6SMax Reitz     Error *local_err = NULL;
667b3838a40SPeter Lieven     BlockdevDetectZeroesOptions detect_zeroes = BLOCKDEV_DETECT_ZEROES_OPTIONS_OFF;
6684fbec260SMax Reitz     QDict *options = NULL;
66968b96f15SEric Blake     const char *export_name = NULL; /* defaults to "" later for server mode */
670b1a75b33SEric Blake     const char *export_description = NULL;
671636192c4SEric Blake     const char *bitmap = NULL;
672145614a1SDaniel P. Berrange     const char *tlscredsid = NULL;
67377c9aaefSDaniel P. Berrange     bool imageOpts = false;
6746effd5bfSKevin Wolf     bool writethrough = true;
67539ca463eSDenis V. Lunev     char *trace_file = NULL;
676ffb31e1dSMax Reitz     bool fork_process = false;
67768b96f15SEric Blake     bool list = false;
678ffb31e1dSMax Reitz     int old_stderr = -1;
679a721f53bSRichard W.M. Jones     unsigned socket_activation;
6807a5ca864Sbellard 
681a517e88bSPaolo Bonzini     /* The client thread uses SIGTERM to interrupt the server.  A signal
682a517e88bSPaolo Bonzini      * handler ensures that "qemu-nbd -v -c" exits with a nice status code.
683a517e88bSPaolo Bonzini      */
684bb345110SPaolo Bonzini     struct sigaction sa_sigterm;
685bb345110SPaolo Bonzini     memset(&sa_sigterm, 0, sizeof(sa_sigterm));
686bb345110SPaolo Bonzini     sa_sigterm.sa_handler = termsig_handler;
687bb345110SPaolo Bonzini     sigaction(SIGTERM, &sa_sigterm, NULL);
688c2297088SDaniel P. Berrange 
689041e32b8SMax Reitz #ifdef CONFIG_POSIX
690041e32b8SMax Reitz     signal(SIGPIPE, SIG_IGN);
691041e32b8SMax Reitz #endif
692041e32b8SMax Reitz 
693fe4db84dSDaniel P. Berrange     module_call_init(MODULE_INIT_TRACE);
6943ba1b7baSEric Blake     error_set_progname(argv[0]);
695e8f2d272SEduardo Habkost     qcrypto_init(&error_fatal);
696c2297088SDaniel P. Berrange 
6970ab3b337SDaniel P. Berrange     module_call_init(MODULE_INIT_QOM);
6980ab3b337SDaniel P. Berrange     qemu_add_opts(&qemu_object_opts);
69939ca463eSDenis V. Lunev     qemu_add_opts(&qemu_trace_opts);
70010f5bff6SFam Zheng     qemu_init_exec_dir(argv[0]);
701bb345110SPaolo Bonzini 
7027a5ca864Sbellard     while ((ch = getopt_long(argc, argv, sopt, lopt, &opt_ind)) != -1) {
7037a5ca864Sbellard         switch (ch) {
7047a5ca864Sbellard         case 's':
7052f726488Sths             flags |= BDRV_O_SNAPSHOT;
7062f726488Sths             break;
7072f726488Sths         case 'n':
70839a5235cSPaolo Bonzini             optarg = (char *) "none";
70939a5235cSPaolo Bonzini             /* fallthrough */
71039a5235cSPaolo Bonzini         case QEMU_NBD_OPT_CACHE:
71139a5235cSPaolo Bonzini             if (seen_cache) {
71285b01e09SMarkus Armbruster                 error_report("-n and --cache can only be specified once");
71385b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
71439a5235cSPaolo Bonzini             }
71539a5235cSPaolo Bonzini             seen_cache = true;
7166effd5bfSKevin Wolf             if (bdrv_parse_cache_mode(optarg, &flags, &writethrough) == -1) {
71785b01e09SMarkus Armbruster                 error_report("Invalid cache mode `%s'", optarg);
71885b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
71939a5235cSPaolo Bonzini             }
7207a5ca864Sbellard             break;
72139a5235cSPaolo Bonzini         case QEMU_NBD_OPT_AIO:
72239a5235cSPaolo Bonzini             if (seen_aio) {
72385b01e09SMarkus Armbruster                 error_report("--aio can only be specified once");
72485b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
72539a5235cSPaolo Bonzini             }
72639a5235cSPaolo Bonzini             seen_aio = true;
72739a5235cSPaolo Bonzini             if (!strcmp(optarg, "native")) {
72839a5235cSPaolo Bonzini                 flags |= BDRV_O_NATIVE_AIO;
72939a5235cSPaolo Bonzini             } else if (!strcmp(optarg, "threads")) {
73039a5235cSPaolo Bonzini                 /* this is the default */
73139a5235cSPaolo Bonzini             } else {
73285b01e09SMarkus Armbruster                error_report("invalid aio mode `%s'", optarg);
73385b01e09SMarkus Armbruster                exit(EXIT_FAILURE);
73439a5235cSPaolo Bonzini             }
73539a5235cSPaolo Bonzini             break;
736ded9d2d5SPaolo Bonzini         case QEMU_NBD_OPT_DISCARD:
737ded9d2d5SPaolo Bonzini             if (seen_discard) {
73885b01e09SMarkus Armbruster                 error_report("--discard can only be specified once");
73985b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
740ded9d2d5SPaolo Bonzini             }
741ded9d2d5SPaolo Bonzini             seen_discard = true;
742ded9d2d5SPaolo Bonzini             if (bdrv_parse_discard_flags(optarg, &flags) == -1) {
74385b01e09SMarkus Armbruster                 error_report("Invalid discard mode `%s'", optarg);
74485b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
745ded9d2d5SPaolo Bonzini             }
746ded9d2d5SPaolo Bonzini             break;
747b3838a40SPeter Lieven         case QEMU_NBD_OPT_DETECT_ZEROES:
748b3838a40SPeter Lieven             detect_zeroes =
749f7abe0ecSMarc-André Lureau                 qapi_enum_parse(&BlockdevDetectZeroesOptions_lookup,
750b3838a40SPeter Lieven                                 optarg,
751b3838a40SPeter Lieven                                 BLOCKDEV_DETECT_ZEROES_OPTIONS_OFF,
752b3838a40SPeter Lieven                                 &local_err);
753b3838a40SPeter Lieven             if (local_err) {
754c29b77f9SMarkus Armbruster                 error_reportf_err(local_err,
755c29b77f9SMarkus Armbruster                                   "Failed to parse detect_zeroes mode: ");
75685b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
757b3838a40SPeter Lieven             }
758b3838a40SPeter Lieven             if (detect_zeroes == BLOCKDEV_DETECT_ZEROES_OPTIONS_UNMAP &&
759b3838a40SPeter Lieven                 !(flags & BDRV_O_UNMAP)) {
76085b01e09SMarkus Armbruster                 error_report("setting detect-zeroes to unmap is not allowed "
761b3838a40SPeter Lieven                              "without setting discard operation to unmap");
76285b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
763b3838a40SPeter Lieven             }
764b3838a40SPeter Lieven             break;
7657a5ca864Sbellard         case 'b':
7667a5ca864Sbellard             bindto = optarg;
7677a5ca864Sbellard             break;
7687a5ca864Sbellard         case 'p':
76948bec07eSDaniel P. Berrange             port = optarg;
7707a5ca864Sbellard             break;
7717a5ca864Sbellard         case 'o':
77243b51011SEric Blake             if (qemu_strtou64(optarg, NULL, 0, &dev_offset) < 0) {
77343b51011SEric Blake                 error_report("Invalid offset '%s'", optarg);
77485b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
7757a5ca864Sbellard             }
7767a5ca864Sbellard             break;
7778c116b0eSWenchao Xia         case 'l':
7788c116b0eSWenchao Xia             if (strstart(optarg, SNAPSHOT_OPT_BASE, NULL)) {
77970b94331SMarkus Armbruster                 sn_opts = qemu_opts_parse_noisily(&internal_snapshot_opts,
78070b94331SMarkus Armbruster                                                   optarg, false);
7818c116b0eSWenchao Xia                 if (!sn_opts) {
78285b01e09SMarkus Armbruster                     error_report("Failed in parsing snapshot param `%s'",
7838c116b0eSWenchao Xia                                  optarg);
78485b01e09SMarkus Armbruster                     exit(EXIT_FAILURE);
7858c116b0eSWenchao Xia                 }
7868c116b0eSWenchao Xia             } else {
7878c116b0eSWenchao Xia                 sn_id_or_name = optarg;
7888c116b0eSWenchao Xia             }
7898c116b0eSWenchao Xia             /* fall through */
7907a5ca864Sbellard         case 'r':
791b90fb4b8SPaolo Bonzini             nbdflags |= NBD_FLAG_READ_ONLY;
79207108b29SNaphtali Sprei             flags &= ~BDRV_O_RDWR;
7937a5ca864Sbellard             break;
7947a5ca864Sbellard         case 'P':
7950ae2d546SEric Blake             warn_report("The '-P' option is deprecated; use --image-opts with "
7960ae2d546SEric Blake                         "a raw device wrapper for subset exports instead");
79743b51011SEric Blake             if (qemu_strtoi(optarg, NULL, 0, &partition) < 0 ||
79843b51011SEric Blake                 partition < 1 || partition > 8) {
79943b51011SEric Blake                 error_report("Invalid partition '%s'", optarg);
80085b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
801713cc671SPeter Lieven             }
8027a5ca864Sbellard             break;
803636192c4SEric Blake         case 'B':
804636192c4SEric Blake             bitmap = optarg;
805636192c4SEric Blake             break;
806cd831bd7Sths         case 'k':
807b32f6c28SPaolo Bonzini             sockpath = optarg;
808713cc671SPeter Lieven             if (sockpath[0] != '/') {
8099af9e0feSMarkus Armbruster                 error_report("socket path must be absolute");
81085b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
811713cc671SPeter Lieven             }
812cd831bd7Sths             break;
813cd831bd7Sths         case 'd':
814cd831bd7Sths             disconnect = true;
815cd831bd7Sths             break;
816cd831bd7Sths         case 'c':
817cd831bd7Sths             device = optarg;
818cd831bd7Sths             break;
8193b05a8e9Sths         case 'e':
82043b51011SEric Blake             if (qemu_strtoi(optarg, NULL, 0, &shared) < 0 ||
82143b51011SEric Blake                 shared < 1) {
82285b01e09SMarkus Armbruster                 error_report("Invalid shared device number '%s'", optarg);
82385b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
8243b05a8e9Sths             }
8253b05a8e9Sths             break;
826e6b63677SDaniel P. Berrange         case 'f':
827e6b63677SDaniel P. Berrange             fmt = optarg;
828e6b63677SDaniel P. Berrange             break;
82975818250Sths         case 't':
83075818250Sths             persistent = 1;
83175818250Sths             break;
8323d4b2f9cSDaniel P. Berrange         case 'x':
8333d4b2f9cSDaniel P. Berrange             export_name = optarg;
8343d4b2f9cSDaniel P. Berrange             break;
835b1a75b33SEric Blake         case 'D':
836b1a75b33SEric Blake             export_description = optarg;
837b1a75b33SEric Blake             break;
8387a5ca864Sbellard         case 'v':
8397a5ca864Sbellard             verbose = 1;
8407a5ca864Sbellard             break;
8417a5ca864Sbellard         case 'V':
8427a5ca864Sbellard             version(argv[0]);
8437a5ca864Sbellard             exit(0);
8447a5ca864Sbellard             break;
8457a5ca864Sbellard         case 'h':
8467a5ca864Sbellard             usage(argv[0]);
8477a5ca864Sbellard             exit(0);
8487a5ca864Sbellard             break;
8497a5ca864Sbellard         case '?':
85085b01e09SMarkus Armbruster             error_report("Try `%s --help' for more information.", argv[0]);
85185b01e09SMarkus Armbruster             exit(EXIT_FAILURE);
8520ab3b337SDaniel P. Berrange         case QEMU_NBD_OPT_OBJECT: {
8530ab3b337SDaniel P. Berrange             QemuOpts *opts;
8540ab3b337SDaniel P. Berrange             opts = qemu_opts_parse_noisily(&qemu_object_opts,
8550ab3b337SDaniel P. Berrange                                            optarg, true);
8560ab3b337SDaniel P. Berrange             if (!opts) {
8570ab3b337SDaniel P. Berrange                 exit(EXIT_FAILURE);
8580ab3b337SDaniel P. Berrange             }
8590ab3b337SDaniel P. Berrange         }   break;
860145614a1SDaniel P. Berrange         case QEMU_NBD_OPT_TLSCREDS:
861145614a1SDaniel P. Berrange             tlscredsid = optarg;
862145614a1SDaniel P. Berrange             break;
86377c9aaefSDaniel P. Berrange         case QEMU_NBD_OPT_IMAGE_OPTS:
86477c9aaefSDaniel P. Berrange             imageOpts = true;
86577c9aaefSDaniel P. Berrange             break;
86639ca463eSDenis V. Lunev         case 'T':
86739ca463eSDenis V. Lunev             g_free(trace_file);
86839ca463eSDenis V. Lunev             trace_file = trace_opt_parse(optarg);
86939ca463eSDenis V. Lunev             break;
870*b25e12daSDaniel P. Berrange         case QEMU_NBD_OPT_TLSAUTHZ:
871*b25e12daSDaniel P. Berrange             tlsauthz = optarg;
872*b25e12daSDaniel P. Berrange             break;
873ffb31e1dSMax Reitz         case QEMU_NBD_OPT_FORK:
874ffb31e1dSMax Reitz             fork_process = true;
875ffb31e1dSMax Reitz             break;
87668b96f15SEric Blake         case 'L':
87768b96f15SEric Blake             list = true;
87868b96f15SEric Blake             break;
8797a5ca864Sbellard         }
8807a5ca864Sbellard     }
8817a5ca864Sbellard 
88268b96f15SEric Blake     if (list) {
88368b96f15SEric Blake         if (argc != optind) {
88468b96f15SEric Blake             error_report("List mode is incompatible with a file name");
88568b96f15SEric Blake             exit(EXIT_FAILURE);
88668b96f15SEric Blake         }
88768b96f15SEric Blake         if (export_name || export_description || dev_offset || partition ||
88868b96f15SEric Blake             device || disconnect || fmt || sn_id_or_name || bitmap ||
88968b96f15SEric Blake             seen_aio || seen_discard || seen_cache) {
89068b96f15SEric Blake             error_report("List mode is incompatible with per-device settings");
89168b96f15SEric Blake             exit(EXIT_FAILURE);
89268b96f15SEric Blake         }
89368b96f15SEric Blake         if (fork_process) {
89468b96f15SEric Blake             error_report("List mode is incompatible with forking");
89568b96f15SEric Blake             exit(EXIT_FAILURE);
89668b96f15SEric Blake         }
89768b96f15SEric Blake     } else if ((argc - optind) != 1) {
898433672b0SMarkus Armbruster         error_report("Invalid number of arguments");
899433672b0SMarkus Armbruster         error_printf("Try `%s --help' for more information.\n", argv[0]);
90085b01e09SMarkus Armbruster         exit(EXIT_FAILURE);
90168b96f15SEric Blake     } else if (!export_name) {
90268b96f15SEric Blake         export_name = "";
9037a5ca864Sbellard     }
9047a5ca864Sbellard 
9057e1e0c11SMarkus Armbruster     qemu_opts_foreach(&qemu_object_opts,
9060ab3b337SDaniel P. Berrange                       user_creatable_add_opts_foreach,
9077e1e0c11SMarkus Armbruster                       NULL, &error_fatal);
9080ab3b337SDaniel P. Berrange 
90939ca463eSDenis V. Lunev     if (!trace_init_backends()) {
91039ca463eSDenis V. Lunev         exit(1);
91139ca463eSDenis V. Lunev     }
91239ca463eSDenis V. Lunev     trace_init_file(trace_file);
91339ca463eSDenis V. Lunev     qemu_set_log(LOG_TRACE);
91439ca463eSDenis V. Lunev 
915a721f53bSRichard W.M. Jones     socket_activation = check_socket_activation();
916a721f53bSRichard W.M. Jones     if (socket_activation == 0) {
917a721f53bSRichard W.M. Jones         setup_address_and_port(&bindto, &port);
918a721f53bSRichard W.M. Jones     } else {
919a721f53bSRichard W.M. Jones         /* Using socket activation - check user didn't use -p etc. */
920a721f53bSRichard W.M. Jones         const char *err_msg = socket_activation_validate_opts(device, sockpath,
92168b96f15SEric Blake                                                               bindto, port,
92268b96f15SEric Blake                                                               list);
923a721f53bSRichard W.M. Jones         if (err_msg != NULL) {
924a721f53bSRichard W.M. Jones             error_report("%s", err_msg);
925a721f53bSRichard W.M. Jones             exit(EXIT_FAILURE);
926a721f53bSRichard W.M. Jones         }
92753fabd4bSPaolo Bonzini 
92853fabd4bSPaolo Bonzini         /* qemu-nbd can only listen on a single socket.  */
92953fabd4bSPaolo Bonzini         if (socket_activation > 1) {
93053fabd4bSPaolo Bonzini             error_report("qemu-nbd does not support socket activation with %s > 1",
93153fabd4bSPaolo Bonzini                          "LISTEN_FDS");
93253fabd4bSPaolo Bonzini             exit(EXIT_FAILURE);
93353fabd4bSPaolo Bonzini         }
934a721f53bSRichard W.M. Jones     }
935a721f53bSRichard W.M. Jones 
936145614a1SDaniel P. Berrange     if (tlscredsid) {
937145614a1SDaniel P. Berrange         if (sockpath) {
938145614a1SDaniel P. Berrange             error_report("TLS is only supported with IPv4/IPv6");
939145614a1SDaniel P. Berrange             exit(EXIT_FAILURE);
940145614a1SDaniel P. Berrange         }
941145614a1SDaniel P. Berrange         if (device) {
942145614a1SDaniel P. Berrange             error_report("TLS is not supported with a host device");
943145614a1SDaniel P. Berrange             exit(EXIT_FAILURE);
944145614a1SDaniel P. Berrange         }
945*b25e12daSDaniel P. Berrange         if (tlsauthz && list) {
946*b25e12daSDaniel P. Berrange             error_report("TLS authorization is incompatible with export list");
947*b25e12daSDaniel P. Berrange             exit(EXIT_FAILURE);
948*b25e12daSDaniel P. Berrange         }
94968b96f15SEric Blake         tlscreds = nbd_get_tls_creds(tlscredsid, list, &local_err);
950145614a1SDaniel P. Berrange         if (local_err) {
951145614a1SDaniel P. Berrange             error_report("Failed to get TLS creds %s",
952145614a1SDaniel P. Berrange                          error_get_pretty(local_err));
953145614a1SDaniel P. Berrange             exit(EXIT_FAILURE);
954145614a1SDaniel P. Berrange         }
955*b25e12daSDaniel P. Berrange     } else {
956*b25e12daSDaniel P. Berrange         if (tlsauthz) {
957*b25e12daSDaniel P. Berrange             error_report("--tls-authz is not permitted without --tls-creds");
958*b25e12daSDaniel P. Berrange             exit(EXIT_FAILURE);
959*b25e12daSDaniel P. Berrange         }
960145614a1SDaniel P. Berrange     }
961145614a1SDaniel P. Berrange 
96268b96f15SEric Blake     if (list) {
96368b96f15SEric Blake         saddr = nbd_build_socket_address(sockpath, bindto, port);
96468b96f15SEric Blake         return qemu_nbd_client_list(saddr, tlscreds, bindto);
96568b96f15SEric Blake     }
96668b96f15SEric Blake 
9673c1fa35dSEric Blake #if !HAVE_NBD_DEVICE
9683c1fa35dSEric Blake     if (disconnect || device) {
9693c1fa35dSEric Blake         error_report("Kernel /dev/nbdN support not available");
9703c1fa35dSEric Blake         exit(EXIT_FAILURE);
9713c1fa35dSEric Blake     }
9723c1fa35dSEric Blake #else /* HAVE_NBD_DEVICE */
973cd831bd7Sths     if (disconnect) {
974d0d6ff58SDaniel P. Berrange         int nbdfd = open(argv[optind], O_RDWR);
975d0d6ff58SDaniel P. Berrange         if (nbdfd < 0) {
97685b01e09SMarkus Armbruster             error_report("Cannot open %s: %s", argv[optind],
97785b01e09SMarkus Armbruster                          strerror(errno));
97885b01e09SMarkus Armbruster             exit(EXIT_FAILURE);
979fc19f8a0SPaolo Bonzini         }
980d0d6ff58SDaniel P. Berrange         nbd_disconnect(nbdfd);
981cd831bd7Sths 
982d0d6ff58SDaniel P. Berrange         close(nbdfd);
983cd831bd7Sths 
984cd831bd7Sths         printf("%s disconnected\n", argv[optind]);
985cd831bd7Sths 
986cd831bd7Sths         return 0;
987cd831bd7Sths     }
9883c1fa35dSEric Blake #endif
989cd831bd7Sths 
990ffb31e1dSMax Reitz     if ((device && !verbose) || fork_process) {
991c1f8fdc3SPaolo Bonzini         int stderr_fd[2];
992c1f8fdc3SPaolo Bonzini         pid_t pid;
993c1f8fdc3SPaolo Bonzini         int ret;
994c1f8fdc3SPaolo Bonzini 
995fc19f8a0SPaolo Bonzini         if (qemu_pipe(stderr_fd) < 0) {
99685b01e09SMarkus Armbruster             error_report("Error setting up communication pipe: %s",
99785b01e09SMarkus Armbruster                          strerror(errno));
99885b01e09SMarkus Armbruster             exit(EXIT_FAILURE);
999c1f8fdc3SPaolo Bonzini         }
1000c1f8fdc3SPaolo Bonzini 
1001c1f8fdc3SPaolo Bonzini         /* Now daemonize, but keep a communication channel open to
1002c1f8fdc3SPaolo Bonzini          * print errors and exit with the proper status code.
1003c1f8fdc3SPaolo Bonzini          */
1004c1f8fdc3SPaolo Bonzini         pid = fork();
100570d4739eSMax Reitz         if (pid < 0) {
100685b01e09SMarkus Armbruster             error_report("Failed to fork: %s", strerror(errno));
100785b01e09SMarkus Armbruster             exit(EXIT_FAILURE);
100870d4739eSMax Reitz         } else if (pid == 0) {
1009c1f8fdc3SPaolo Bonzini             close(stderr_fd[0]);
10109faf31b6SMichael Tokarev             ret = qemu_daemon(1, 0);
1011c1f8fdc3SPaolo Bonzini 
1012c1f8fdc3SPaolo Bonzini             /* Temporarily redirect stderr to the parent's pipe...  */
1013ffb31e1dSMax Reitz             old_stderr = dup(STDERR_FILENO);
1014c1f8fdc3SPaolo Bonzini             dup2(stderr_fd[1], STDERR_FILENO);
1015fc19f8a0SPaolo Bonzini             if (ret < 0) {
101685b01e09SMarkus Armbruster                 error_report("Failed to daemonize: %s", strerror(errno));
101785b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
1018c1f8fdc3SPaolo Bonzini             }
1019c1f8fdc3SPaolo Bonzini 
1020c1f8fdc3SPaolo Bonzini             /* ... close the descriptor we inherited and go on.  */
1021c1f8fdc3SPaolo Bonzini             close(stderr_fd[1]);
1022c1f8fdc3SPaolo Bonzini         } else {
1023c1f8fdc3SPaolo Bonzini             bool errors = false;
1024c1f8fdc3SPaolo Bonzini             char *buf;
1025c1f8fdc3SPaolo Bonzini 
1026c1f8fdc3SPaolo Bonzini             /* In the parent.  Print error messages from the child until
1027c1f8fdc3SPaolo Bonzini              * it closes the pipe.
1028c1f8fdc3SPaolo Bonzini              */
1029c1f8fdc3SPaolo Bonzini             close(stderr_fd[1]);
1030c1f8fdc3SPaolo Bonzini             buf = g_malloc(1024);
1031c1f8fdc3SPaolo Bonzini             while ((ret = read(stderr_fd[0], buf, 1024)) > 0) {
1032c1f8fdc3SPaolo Bonzini                 errors = true;
1033c1f8fdc3SPaolo Bonzini                 ret = qemu_write_full(STDERR_FILENO, buf, ret);
1034fc19f8a0SPaolo Bonzini                 if (ret < 0) {
1035c1f8fdc3SPaolo Bonzini                     exit(EXIT_FAILURE);
1036c1f8fdc3SPaolo Bonzini                 }
1037c1f8fdc3SPaolo Bonzini             }
1038fc19f8a0SPaolo Bonzini             if (ret < 0) {
103985b01e09SMarkus Armbruster                 error_report("Cannot read from daemon: %s",
104085b01e09SMarkus Armbruster                              strerror(errno));
104185b01e09SMarkus Armbruster                 exit(EXIT_FAILURE);
1042c1f8fdc3SPaolo Bonzini             }
1043c1f8fdc3SPaolo Bonzini 
1044c1f8fdc3SPaolo Bonzini             /* Usually the daemon should not print any message.
1045c1f8fdc3SPaolo Bonzini              * Exit with zero status in that case.
1046c1f8fdc3SPaolo Bonzini              */
1047c1f8fdc3SPaolo Bonzini             exit(errors);
1048c1f8fdc3SPaolo Bonzini         }
1049c1f8fdc3SPaolo Bonzini     }
1050c1f8fdc3SPaolo Bonzini 
1051a6ac2313SPaolo Bonzini     if (device != NULL && sockpath == NULL) {
1052b32f6c28SPaolo Bonzini         sockpath = g_malloc(128);
1053b32f6c28SPaolo Bonzini         snprintf(sockpath, 128, SOCKET_PATH, basename(device));
1054cd831bd7Sths     }
1055cd831bd7Sths 
1056e4849c1dSDaniel P. Berrange     server = qio_net_listener_new();
1057a721f53bSRichard W.M. Jones     if (socket_activation == 0) {
105848bec07eSDaniel P. Berrange         saddr = nbd_build_socket_address(sockpath, bindto, port);
1059e4849c1dSDaniel P. Berrange         if (qio_net_listener_open_sync(server, saddr, &local_err) < 0) {
1060e4849c1dSDaniel P. Berrange             object_unref(OBJECT(server));
1061a721f53bSRichard W.M. Jones             error_report_err(local_err);
1062e4849c1dSDaniel P. Berrange             exit(EXIT_FAILURE);
1063a721f53bSRichard W.M. Jones         }
1064a721f53bSRichard W.M. Jones     } else {
1065e4849c1dSDaniel P. Berrange         size_t i;
1066a721f53bSRichard W.M. Jones         /* See comment in check_socket_activation above. */
1067e4849c1dSDaniel P. Berrange         for (i = 0; i < socket_activation; i++) {
1068e4849c1dSDaniel P. Berrange             QIOChannelSocket *sioc;
1069e4849c1dSDaniel P. Berrange             sioc = qio_channel_socket_new_fd(FIRST_SOCKET_ACTIVATION_FD + i,
1070a721f53bSRichard W.M. Jones                                              &local_err);
1071e4849c1dSDaniel P. Berrange             if (sioc == NULL) {
1072e4849c1dSDaniel P. Berrange                 object_unref(OBJECT(server));
1073a721f53bSRichard W.M. Jones                 error_report("Failed to use socket activation: %s",
1074a721f53bSRichard W.M. Jones                              error_get_pretty(local_err));
1075a721f53bSRichard W.M. Jones                 exit(EXIT_FAILURE);
1076a721f53bSRichard W.M. Jones             }
1077e4849c1dSDaniel P. Berrange             qio_net_listener_add(server, sioc);
1078e4849c1dSDaniel P. Berrange             object_unref(OBJECT(sioc));
1079e4849c1dSDaniel P. Berrange         }
1080a721f53bSRichard W.M. Jones     }
108148bec07eSDaniel P. Berrange 
10822f78e491SChrysostomos Nanakos     if (qemu_init_main_loop(&local_err)) {
1083565f65d2SMarkus Armbruster         error_report_err(local_err);
10842f78e491SChrysostomos Nanakos         exit(EXIT_FAILURE);
10852f78e491SChrysostomos Nanakos     }
1086802ddc37SPaolo Bonzini     bdrv_init();
1087b3b5299dSKevin Wolf     atexit(qemu_nbd_shutdown);
1088802ddc37SPaolo Bonzini 
108977c9aaefSDaniel P. Berrange     srcpath = argv[optind];
109077c9aaefSDaniel P. Berrange     if (imageOpts) {
109177c9aaefSDaniel P. Berrange         QemuOpts *opts;
109277c9aaefSDaniel P. Berrange         if (fmt) {
109377c9aaefSDaniel P. Berrange             error_report("--image-opts and -f are mutually exclusive");
109477c9aaefSDaniel P. Berrange             exit(EXIT_FAILURE);
109577c9aaefSDaniel P. Berrange         }
109677c9aaefSDaniel P. Berrange         opts = qemu_opts_parse_noisily(&file_opts, srcpath, true);
109777c9aaefSDaniel P. Berrange         if (!opts) {
109877c9aaefSDaniel P. Berrange             qemu_opts_reset(&file_opts);
109977c9aaefSDaniel P. Berrange             exit(EXIT_FAILURE);
110077c9aaefSDaniel P. Berrange         }
110177c9aaefSDaniel P. Berrange         options = qemu_opts_to_qdict(opts, NULL);
110277c9aaefSDaniel P. Berrange         qemu_opts_reset(&file_opts);
1103efaa7c4eSMax Reitz         blk = blk_new_open(NULL, NULL, options, flags, &local_err);
110477c9aaefSDaniel P. Berrange     } else {
1105e6b63677SDaniel P. Berrange         if (fmt) {
11064fbec260SMax Reitz             options = qdict_new();
110746f5ac20SEric Blake             qdict_put_str(options, "driver", fmt);
1108e6b63677SDaniel P. Berrange         }
1109efaa7c4eSMax Reitz         blk = blk_new_open(srcpath, NULL, options, flags, &local_err);
111077c9aaefSDaniel P. Berrange     }
111177c9aaefSDaniel P. Berrange 
11124fbec260SMax Reitz     if (!blk) {
1113c29b77f9SMarkus Armbruster         error_reportf_err(local_err, "Failed to blk_new_open '%s': ",
1114c29b77f9SMarkus Armbruster                           argv[optind]);
111585b01e09SMarkus Armbruster         exit(EXIT_FAILURE);
1116802ddc37SPaolo Bonzini     }
11174fbec260SMax Reitz     bs = blk_bs(blk);
1118802ddc37SPaolo Bonzini 
11196effd5bfSKevin Wolf     blk_set_enable_write_cache(blk, !writethrough);
11206effd5bfSKevin Wolf 
11218c116b0eSWenchao Xia     if (sn_opts) {
11228c116b0eSWenchao Xia         ret = bdrv_snapshot_load_tmp(bs,
11238c116b0eSWenchao Xia                                      qemu_opt_get(sn_opts, SNAPSHOT_OPT_ID),
11248c116b0eSWenchao Xia                                      qemu_opt_get(sn_opts, SNAPSHOT_OPT_NAME),
11258c116b0eSWenchao Xia                                      &local_err);
11268c116b0eSWenchao Xia     } else if (sn_id_or_name) {
11278c116b0eSWenchao Xia         ret = bdrv_snapshot_load_tmp_by_id_or_name(bs, sn_id_or_name,
11288c116b0eSWenchao Xia                                                    &local_err);
11298c116b0eSWenchao Xia     }
11308c116b0eSWenchao Xia     if (ret < 0) {
1131c29b77f9SMarkus Armbruster         error_reportf_err(local_err, "Failed to load snapshot: ");
113285b01e09SMarkus Armbruster         exit(EXIT_FAILURE);
11338c116b0eSWenchao Xia     }
11348c116b0eSWenchao Xia 
1135b3838a40SPeter Lieven     bs->detect_zeroes = detect_zeroes;
11364c58e80aSMax Reitz     fd_size = blk_getlength(blk);
113798f44bbeSMax Reitz     if (fd_size < 0) {
113885b01e09SMarkus Armbruster         error_report("Failed to determine the image length: %s",
113998f44bbeSMax Reitz                      strerror(-fd_size));
114085b01e09SMarkus Armbruster         exit(EXIT_FAILURE);
114198f44bbeSMax Reitz     }
1142802ddc37SPaolo Bonzini 
1143e424b655STomáš Golembiovský     if (dev_offset >= fd_size) {
11449d26dfcbSEric Blake         error_report("Offset (%" PRIu64 ") has to be smaller than the image "
11459d26dfcbSEric Blake                      "size (%" PRId64 ")", dev_offset, fd_size);
1146e424b655STomáš Golembiovský         exit(EXIT_FAILURE);
1147e424b655STomáš Golembiovský     }
1148e424b655STomáš Golembiovský     fd_size -= dev_offset;
1149e424b655STomáš Golembiovský 
115043b51011SEric Blake     if (partition) {
11519d26dfcbSEric Blake         uint64_t limit;
11524485936bSEric Blake 
11534485936bSEric Blake         if (dev_offset) {
11544485936bSEric Blake             error_report("Cannot request partition and offset together");
11554485936bSEric Blake             exit(EXIT_FAILURE);
11564485936bSEric Blake         }
11574485936bSEric Blake         ret = find_partition(blk, partition, &dev_offset, &limit);
1158185b4338SPaolo Bonzini         if (ret < 0) {
115985b01e09SMarkus Armbruster             error_report("Could not find partition %d: %s", partition,
1160a4699e55SMarkus Armbruster                          strerror(-ret));
116185b01e09SMarkus Armbruster             exit(EXIT_FAILURE);
1162802ddc37SPaolo Bonzini         }
11634485936bSEric Blake         /*
11644485936bSEric Blake          * MBR partition limits are (32-bit << 9); this assert lets
11659d26dfcbSEric Blake          * the compiler know that we can't overflow 64 bits.
11664485936bSEric Blake          */
11679d26dfcbSEric Blake         assert(dev_offset + limit >= dev_offset);
11684485936bSEric Blake         if (dev_offset + limit > fd_size) {
11699d26dfcbSEric Blake             error_report("Discovered partition %d at offset %" PRIu64
11709d26dfcbSEric Blake                          " size %" PRIu64 ", but size exceeds file length %"
11719d26dfcbSEric Blake                          PRId64, partition, dev_offset, limit, fd_size);
11724485936bSEric Blake             exit(EXIT_FAILURE);
11734485936bSEric Blake         }
11744485936bSEric Blake         fd_size = limit;
1175185b4338SPaolo Bonzini     }
1176802ddc37SPaolo Bonzini 
11773fa4c765SEric Blake     export = nbd_export_new(bs, dev_offset, fd_size, export_name,
1178636192c4SEric Blake                             export_description, bitmap, nbdflags,
1179678ba275SEric Blake                             nbd_export_closed, writethrough, NULL,
1180678ba275SEric Blake                             &error_fatal);
11813b05a8e9Sths 
1182f1ef5555SPaolo Bonzini     if (device) {
11833c1fa35dSEric Blake #if HAVE_NBD_DEVICE
1184f1ef5555SPaolo Bonzini         int ret;
1185f1ef5555SPaolo Bonzini 
1186a6ac2313SPaolo Bonzini         ret = pthread_create(&client_thread, NULL, nbd_client_thread, device);
1187f1ef5555SPaolo Bonzini         if (ret != 0) {
118885b01e09SMarkus Armbruster             error_report("Failed to create client thread: %s", strerror(ret));
118985b01e09SMarkus Armbruster             exit(EXIT_FAILURE);
1190f1ef5555SPaolo Bonzini         }
11913c1fa35dSEric Blake #endif
1192f1ef5555SPaolo Bonzini     } else {
1193f1ef5555SPaolo Bonzini         /* Shut up GCC warnings.  */
1194f1ef5555SPaolo Bonzini         memset(&client_thread, 0, sizeof(client_thread));
1195f1ef5555SPaolo Bonzini     }
1196f1ef5555SPaolo Bonzini 
1197d0d6ff58SDaniel P. Berrange     nbd_update_server_watch();
11987a5ca864Sbellard 
11999faf31b6SMichael Tokarev     /* now when the initialization is (almost) complete, chdir("/")
12009faf31b6SMichael Tokarev      * to free any busy filesystems */
12019faf31b6SMichael Tokarev     if (chdir("/") < 0) {
120285b01e09SMarkus Armbruster         error_report("Could not chdir to root directory: %s",
120385b01e09SMarkus Armbruster                      strerror(errno));
120485b01e09SMarkus Armbruster         exit(EXIT_FAILURE);
12059faf31b6SMichael Tokarev     }
12069faf31b6SMichael Tokarev 
1207ffb31e1dSMax Reitz     if (fork_process) {
1208ffb31e1dSMax Reitz         dup2(old_stderr, STDERR_FILENO);
1209ffb31e1dSMax Reitz         close(old_stderr);
1210ffb31e1dSMax Reitz     }
1211ffb31e1dSMax Reitz 
12127860a380SPaolo Bonzini     state = RUNNING;
12133b05a8e9Sths     do {
1214a61c6782SPaolo Bonzini         main_loop_wait(false);
12157860a380SPaolo Bonzini         if (state == TERMINATE) {
12167860a380SPaolo Bonzini             state = TERMINATING;
12179d976580SPhilippe Mathieu-Daudé             nbd_export_close(export);
12189d976580SPhilippe Mathieu-Daudé             nbd_export_put(export);
12199d976580SPhilippe Mathieu-Daudé             export = NULL;
12207860a380SPaolo Bonzini         }
12217860a380SPaolo Bonzini     } while (state != TERMINATED);
12222c8d9f06SPaolo Bonzini 
122326f54e9aSMarkus Armbruster     blk_unref(blk);
1224b32f6c28SPaolo Bonzini     if (sockpath) {
1225b32f6c28SPaolo Bonzini         unlink(sockpath);
1226b32f6c28SPaolo Bonzini     }
12277a5ca864Sbellard 
12288c116b0eSWenchao Xia     qemu_opts_del(sn_opts);
12298c116b0eSWenchao Xia 
1230a517e88bSPaolo Bonzini     if (device) {
1231a517e88bSPaolo Bonzini         void *ret;
1232a517e88bSPaolo Bonzini         pthread_join(client_thread, &ret);
1233a517e88bSPaolo Bonzini         exit(ret != NULL);
1234a517e88bSPaolo Bonzini     } else {
1235a517e88bSPaolo Bonzini         exit(EXIT_SUCCESS);
1236a517e88bSPaolo Bonzini     }
12377a5ca864Sbellard }
1238