1cd831bd7Sths /* 27a5ca864Sbellard * Copyright (C) 2005 Anthony Liguori <anthony@codemonkey.ws> 37a5ca864Sbellard * 47a5ca864Sbellard * Network Block Device 57a5ca864Sbellard * 67a5ca864Sbellard * This program is free software; you can redistribute it and/or modify 77a5ca864Sbellard * it under the terms of the GNU General Public License as published by 87a5ca864Sbellard * the Free Software Foundation; under version 2 of the License. 97a5ca864Sbellard * 107a5ca864Sbellard * This program is distributed in the hope that it will be useful, 117a5ca864Sbellard * but WITHOUT ANY WARRANTY; without even the implied warranty of 127a5ca864Sbellard * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 137a5ca864Sbellard * GNU General Public License for more details. 147a5ca864Sbellard * 157a5ca864Sbellard * You should have received a copy of the GNU General Public License 168167ee88SBlue Swirl * along with this program; if not, see <http://www.gnu.org/licenses/>. 177a5ca864Sbellard */ 187a5ca864Sbellard 195a61cb60SStefan Weil #include "qemu-common.h" 20737e150eSPaolo Bonzini #include "block/block.h" 21737e150eSPaolo Bonzini #include "block/nbd.h" 226a1751b7SAlex Bligh #include "qemu/main-loop.h" 23537b41f5SPaolo Bonzini #include "qemu/sockets.h" 24537b41f5SPaolo Bonzini #include "qemu/error-report.h" 258c116b0eSWenchao Xia #include "block/snapshot.h" 267a5ca864Sbellard 277a5ca864Sbellard #include <stdarg.h> 287a5ca864Sbellard #include <stdio.h> 297a5ca864Sbellard #include <getopt.h> 307a5ca864Sbellard #include <err.h> 31cd831bd7Sths #include <sys/types.h> 327a5ca864Sbellard #include <sys/socket.h> 337a5ca864Sbellard #include <netinet/in.h> 347a5ca864Sbellard #include <netinet/tcp.h> 357a5ca864Sbellard #include <arpa/inet.h> 36cd831bd7Sths #include <signal.h> 372bff4b6fSBlue Swirl #include <libgen.h> 38a517e88bSPaolo Bonzini #include <pthread.h> 39cd831bd7Sths 40cd831bd7Sths #define SOCKET_PATH "/var/lock/qemu-nbd-%s" 4139a5235cSPaolo Bonzini #define QEMU_NBD_OPT_CACHE 1 4239a5235cSPaolo Bonzini #define QEMU_NBD_OPT_AIO 2 43ded9d2d5SPaolo Bonzini #define QEMU_NBD_OPT_DISCARD 3 447a5ca864Sbellard 45af49bbbeSPaolo Bonzini static NBDExport *exp; 46b1d8e52eSblueswir1 static int verbose; 47a517e88bSPaolo Bonzini static char *srcpath; 48a517e88bSPaolo Bonzini static char *sockpath; 497860a380SPaolo Bonzini static int persistent = 0; 507860a380SPaolo Bonzini static enum { RUNNING, TERMINATE, TERMINATING, TERMINATED } state; 51a61c6782SPaolo Bonzini static int shared = 1; 52a61c6782SPaolo Bonzini static int nb_fds; 537a5ca864Sbellard 547a5ca864Sbellard static void usage(const char *name) 557a5ca864Sbellard { 56b033cd86SPaolo Bonzini (printf) ( 577a5ca864Sbellard "Usage: %s [OPTIONS] FILE\n" 587a5ca864Sbellard "QEMU Disk Network Block Device Server\n" 597a5ca864Sbellard "\n" 607a5ca864Sbellard " -h, --help display this help and exit\n" 617a5ca864Sbellard " -V, --version output version information and exit\n" 627a5ca864Sbellard "\n" 63b033cd86SPaolo Bonzini "Connection properties:\n" 64b033cd86SPaolo Bonzini " -p, --port=PORT port to listen on (default `%d')\n" 65b033cd86SPaolo Bonzini " -b, --bind=IFACE interface to bind to (default `0.0.0.0')\n" 66b033cd86SPaolo Bonzini " -k, --socket=PATH path to the unix socket\n" 67b033cd86SPaolo Bonzini " (default '"SOCKET_PATH"')\n" 68b033cd86SPaolo Bonzini " -e, --shared=NUM device can be shared by NUM clients (default '1')\n" 69b033cd86SPaolo Bonzini " -t, --persistent don't exit on the last connection\n" 70b033cd86SPaolo Bonzini " -v, --verbose display extra debugging information\n" 71b033cd86SPaolo Bonzini "\n" 72b033cd86SPaolo Bonzini "Exposing part of the image:\n" 73b033cd86SPaolo Bonzini " -o, --offset=OFFSET offset into the image\n" 74b033cd86SPaolo Bonzini " -P, --partition=NUM only expose partition NUM\n" 75b033cd86SPaolo Bonzini "\n" 76b033cd86SPaolo Bonzini #ifdef __linux__ 77b033cd86SPaolo Bonzini "Kernel NBD client support:\n" 78b033cd86SPaolo Bonzini " -c, --connect=DEV connect FILE to the local NBD device DEV\n" 79b033cd86SPaolo Bonzini " -d, --disconnect disconnect the specified device\n" 80b033cd86SPaolo Bonzini "\n" 81b033cd86SPaolo Bonzini #endif 82b033cd86SPaolo Bonzini "\n" 83b033cd86SPaolo Bonzini "Block device options:\n" 844323fdcfSWenchao Xia " -f, --format=FORMAT set image format (raw, qcow2, ...)\n" 85b033cd86SPaolo Bonzini " -r, --read-only export read-only\n" 868c116b0eSWenchao Xia " -s, --snapshot use FILE as an external snapshot, create a temporary\n" 878c116b0eSWenchao Xia " file with backing_file=FILE, redirect the write to\n" 888c116b0eSWenchao Xia " the temporary one\n" 898c116b0eSWenchao Xia " -l, --load-snapshot=SNAPSHOT_PARAM\n" 908c116b0eSWenchao Xia " load an internal snapshot inside FILE and export it\n" 918c116b0eSWenchao Xia " as an read-only device, SNAPSHOT_PARAM format is\n" 928c116b0eSWenchao Xia " 'snapshot.id=[ID],snapshot.name=[NAME]', or\n" 938c116b0eSWenchao Xia " '[ID_OR_NAME]'\n" 94b033cd86SPaolo Bonzini " -n, --nocache disable host cache\n" 9539a5235cSPaolo Bonzini " --cache=MODE set cache mode (none, writeback, ...)\n" 9639a5235cSPaolo Bonzini #ifdef CONFIG_LINUX_AIO 9739a5235cSPaolo Bonzini " --aio=MODE set AIO mode (native or threads)\n" 9839a5235cSPaolo Bonzini #endif 99b033cd86SPaolo Bonzini "\n" 100b033cd86SPaolo Bonzini "Report bugs to <qemu-devel@nongnu.org>\n" 101c2e2872bSLaurent Vivier , name, NBD_DEFAULT_PORT, "DEVICE"); 1027a5ca864Sbellard } 1037a5ca864Sbellard 1047a5ca864Sbellard static void version(const char *name) 1057a5ca864Sbellard { 1067a5ca864Sbellard printf( 107315bc7aaSths "%s version 0.0.1\n" 1087a5ca864Sbellard "Written by Anthony Liguori.\n" 1097a5ca864Sbellard "\n" 1107a5ca864Sbellard "Copyright (C) 2006 Anthony Liguori <anthony@codemonkey.ws>.\n" 1117a5ca864Sbellard "This is free software; see the source for copying conditions. There is NO\n" 1127a5ca864Sbellard "warranty; not even for MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.\n" 113315bc7aaSths , name); 1147a5ca864Sbellard } 1157a5ca864Sbellard 1167a5ca864Sbellard struct partition_record 1177a5ca864Sbellard { 1187a5ca864Sbellard uint8_t bootable; 1197a5ca864Sbellard uint8_t start_head; 1207a5ca864Sbellard uint32_t start_cylinder; 1217a5ca864Sbellard uint8_t start_sector; 1227a5ca864Sbellard uint8_t system; 1237a5ca864Sbellard uint8_t end_head; 1247a5ca864Sbellard uint8_t end_cylinder; 1257a5ca864Sbellard uint8_t end_sector; 1267a5ca864Sbellard uint32_t start_sector_abs; 1277a5ca864Sbellard uint32_t nb_sectors_abs; 1287a5ca864Sbellard }; 1297a5ca864Sbellard 1307a5ca864Sbellard static void read_partition(uint8_t *p, struct partition_record *r) 1317a5ca864Sbellard { 1327a5ca864Sbellard r->bootable = p[0]; 1337a5ca864Sbellard r->start_head = p[1]; 1347a5ca864Sbellard r->start_cylinder = p[3] | ((p[2] << 2) & 0x0300); 1357a5ca864Sbellard r->start_sector = p[2] & 0x3f; 1367a5ca864Sbellard r->system = p[4]; 1377a5ca864Sbellard r->end_head = p[5]; 1387a5ca864Sbellard r->end_cylinder = p[7] | ((p[6] << 2) & 0x300); 1397a5ca864Sbellard r->end_sector = p[6] & 0x3f; 1407a5ca864Sbellard r->start_sector_abs = p[8] | p[9] << 8 | p[10] << 16 | p[11] << 24; 1417a5ca864Sbellard r->nb_sectors_abs = p[12] | p[13] << 8 | p[14] << 16 | p[15] << 24; 1427a5ca864Sbellard } 1437a5ca864Sbellard 1447a5ca864Sbellard static int find_partition(BlockDriverState *bs, int partition, 1457a5ca864Sbellard off_t *offset, off_t *size) 1467a5ca864Sbellard { 1477a5ca864Sbellard struct partition_record mbr[4]; 1487a5ca864Sbellard uint8_t data[512]; 1497a5ca864Sbellard int i; 1507a5ca864Sbellard int ext_partnum = 4; 151cb7cf0e3SRyota Ozaki int ret; 1527a5ca864Sbellard 153cb7cf0e3SRyota Ozaki if ((ret = bdrv_read(bs, 0, data, 1)) < 0) { 154cb7cf0e3SRyota Ozaki errno = -ret; 155cb7cf0e3SRyota Ozaki err(EXIT_FAILURE, "error while reading"); 156cb7cf0e3SRyota Ozaki } 1577a5ca864Sbellard 1587a5ca864Sbellard if (data[510] != 0x55 || data[511] != 0xaa) { 159185b4338SPaolo Bonzini return -EINVAL; 1607a5ca864Sbellard } 1617a5ca864Sbellard 1627a5ca864Sbellard for (i = 0; i < 4; i++) { 1637a5ca864Sbellard read_partition(&data[446 + 16 * i], &mbr[i]); 1647a5ca864Sbellard 1657a5ca864Sbellard if (!mbr[i].nb_sectors_abs) 1667a5ca864Sbellard continue; 1677a5ca864Sbellard 1687a5ca864Sbellard if (mbr[i].system == 0xF || mbr[i].system == 0x5) { 1697a5ca864Sbellard struct partition_record ext[4]; 1707a5ca864Sbellard uint8_t data1[512]; 1717a5ca864Sbellard int j; 1727a5ca864Sbellard 173cb7cf0e3SRyota Ozaki if ((ret = bdrv_read(bs, mbr[i].start_sector_abs, data1, 1)) < 0) { 174cb7cf0e3SRyota Ozaki errno = -ret; 175cb7cf0e3SRyota Ozaki err(EXIT_FAILURE, "error while reading"); 176cb7cf0e3SRyota Ozaki } 1777a5ca864Sbellard 1787a5ca864Sbellard for (j = 0; j < 4; j++) { 1797a5ca864Sbellard read_partition(&data1[446 + 16 * j], &ext[j]); 1807a5ca864Sbellard if (!ext[j].nb_sectors_abs) 1817a5ca864Sbellard continue; 1827a5ca864Sbellard 1837a5ca864Sbellard if ((ext_partnum + j + 1) == partition) { 1847a5ca864Sbellard *offset = (uint64_t)ext[j].start_sector_abs << 9; 1857a5ca864Sbellard *size = (uint64_t)ext[j].nb_sectors_abs << 9; 1867a5ca864Sbellard return 0; 1877a5ca864Sbellard } 1887a5ca864Sbellard } 1897a5ca864Sbellard ext_partnum += 4; 1907a5ca864Sbellard } else if ((i + 1) == partition) { 1917a5ca864Sbellard *offset = (uint64_t)mbr[i].start_sector_abs << 9; 1927a5ca864Sbellard *size = (uint64_t)mbr[i].nb_sectors_abs << 9; 1937a5ca864Sbellard return 0; 1947a5ca864Sbellard } 1957a5ca864Sbellard } 1967a5ca864Sbellard 197185b4338SPaolo Bonzini return -ENOENT; 1987a5ca864Sbellard } 1997a5ca864Sbellard 200bb345110SPaolo Bonzini static void termsig_handler(int signum) 201bb345110SPaolo Bonzini { 2027860a380SPaolo Bonzini state = TERMINATE; 203a61c6782SPaolo Bonzini qemu_notify_event(); 204bb345110SPaolo Bonzini } 205bb345110SPaolo Bonzini 206537b41f5SPaolo Bonzini static void combine_addr(char *buf, size_t len, const char* address, 207537b41f5SPaolo Bonzini uint16_t port) 208537b41f5SPaolo Bonzini { 209537b41f5SPaolo Bonzini /* If the address-part contains a colon, it's an IPv6 IP so needs [] */ 210537b41f5SPaolo Bonzini if (strstr(address, ":")) { 211537b41f5SPaolo Bonzini snprintf(buf, len, "[%s]:%u", address, port); 212537b41f5SPaolo Bonzini } else { 213537b41f5SPaolo Bonzini snprintf(buf, len, "%s:%u", address, port); 214537b41f5SPaolo Bonzini } 215537b41f5SPaolo Bonzini } 216537b41f5SPaolo Bonzini 217537b41f5SPaolo Bonzini static int tcp_socket_incoming(const char *address, uint16_t port) 218537b41f5SPaolo Bonzini { 219537b41f5SPaolo Bonzini char address_and_port[128]; 220537b41f5SPaolo Bonzini Error *local_err = NULL; 221537b41f5SPaolo Bonzini 222537b41f5SPaolo Bonzini combine_addr(address_and_port, 128, address, port); 223537b41f5SPaolo Bonzini int fd = inet_listen(address_and_port, NULL, 0, SOCK_STREAM, 0, &local_err); 224537b41f5SPaolo Bonzini 225537b41f5SPaolo Bonzini if (local_err != NULL) { 2263775ec6fSMarkus Armbruster error_report("%s", error_get_pretty(local_err)); 227537b41f5SPaolo Bonzini error_free(local_err); 228537b41f5SPaolo Bonzini } 229537b41f5SPaolo Bonzini return fd; 230537b41f5SPaolo Bonzini } 231537b41f5SPaolo Bonzini 232537b41f5SPaolo Bonzini static int unix_socket_incoming(const char *path) 233537b41f5SPaolo Bonzini { 234537b41f5SPaolo Bonzini Error *local_err = NULL; 235537b41f5SPaolo Bonzini int fd = unix_listen(path, NULL, 0, &local_err); 236537b41f5SPaolo Bonzini 237537b41f5SPaolo Bonzini if (local_err != NULL) { 2383775ec6fSMarkus Armbruster error_report("%s", error_get_pretty(local_err)); 239537b41f5SPaolo Bonzini error_free(local_err); 240537b41f5SPaolo Bonzini } 241537b41f5SPaolo Bonzini return fd; 242537b41f5SPaolo Bonzini } 243537b41f5SPaolo Bonzini 244537b41f5SPaolo Bonzini static int unix_socket_outgoing(const char *path) 245537b41f5SPaolo Bonzini { 246537b41f5SPaolo Bonzini Error *local_err = NULL; 247537b41f5SPaolo Bonzini int fd = unix_connect(path, &local_err); 248537b41f5SPaolo Bonzini 249537b41f5SPaolo Bonzini if (local_err != NULL) { 2503775ec6fSMarkus Armbruster error_report("%s", error_get_pretty(local_err)); 251537b41f5SPaolo Bonzini error_free(local_err); 252537b41f5SPaolo Bonzini } 253537b41f5SPaolo Bonzini return fd; 254537b41f5SPaolo Bonzini } 255537b41f5SPaolo Bonzini 256a517e88bSPaolo Bonzini static void *show_parts(void *arg) 257cd831bd7Sths { 258a6ac2313SPaolo Bonzini char *device = arg; 259cd831bd7Sths int nbd; 260cd831bd7Sths 261cd831bd7Sths /* linux just needs an open() to trigger 262cd831bd7Sths * the partition table update 263cd831bd7Sths * but remember to load the module with max_part != 0 : 264cd831bd7Sths * modprobe nbd max_part=63 265cd831bd7Sths */ 266cd831bd7Sths nbd = open(device, O_RDWR); 267fc19f8a0SPaolo Bonzini if (nbd >= 0) { 268cd831bd7Sths close(nbd); 269cd831bd7Sths } 270a517e88bSPaolo Bonzini return NULL; 271a517e88bSPaolo Bonzini } 272a517e88bSPaolo Bonzini 273a517e88bSPaolo Bonzini static void *nbd_client_thread(void *arg) 274a517e88bSPaolo Bonzini { 275a6ac2313SPaolo Bonzini char *device = arg; 276a517e88bSPaolo Bonzini off_t size; 277a517e88bSPaolo Bonzini size_t blocksize; 278a517e88bSPaolo Bonzini uint32_t nbdflags; 279a6ac2313SPaolo Bonzini int fd, sock; 280a517e88bSPaolo Bonzini int ret; 281a517e88bSPaolo Bonzini pthread_t show_parts_thread; 282a517e88bSPaolo Bonzini 283a517e88bSPaolo Bonzini sock = unix_socket_outgoing(sockpath); 284fc19f8a0SPaolo Bonzini if (sock < 0) { 285a517e88bSPaolo Bonzini goto out; 286a517e88bSPaolo Bonzini } 287a517e88bSPaolo Bonzini 288a517e88bSPaolo Bonzini ret = nbd_receive_negotiate(sock, NULL, &nbdflags, 289a517e88bSPaolo Bonzini &size, &blocksize); 290fc19f8a0SPaolo Bonzini if (ret < 0) { 2910c544d73SPaolo Bonzini goto out_socket; 292a517e88bSPaolo Bonzini } 293a517e88bSPaolo Bonzini 294a6ac2313SPaolo Bonzini fd = open(device, O_RDWR); 295fc19f8a0SPaolo Bonzini if (fd < 0) { 296a6ac2313SPaolo Bonzini /* Linux-only, we can use %m in printf. */ 2975672ee54SHani Benhabiles fprintf(stderr, "Failed to open %s: %m\n", device); 2980c544d73SPaolo Bonzini goto out_socket; 299a6ac2313SPaolo Bonzini } 300a6ac2313SPaolo Bonzini 301a517e88bSPaolo Bonzini ret = nbd_init(fd, sock, nbdflags, size, blocksize); 302fc19f8a0SPaolo Bonzini if (ret < 0) { 3030c544d73SPaolo Bonzini goto out_fd; 304a517e88bSPaolo Bonzini } 305a517e88bSPaolo Bonzini 306a517e88bSPaolo Bonzini /* update partition table */ 307a6ac2313SPaolo Bonzini pthread_create(&show_parts_thread, NULL, show_parts, device); 308a517e88bSPaolo Bonzini 309c1f8fdc3SPaolo Bonzini if (verbose) { 310a517e88bSPaolo Bonzini fprintf(stderr, "NBD device %s is now connected to %s\n", 311a517e88bSPaolo Bonzini device, srcpath); 312c1f8fdc3SPaolo Bonzini } else { 313c1f8fdc3SPaolo Bonzini /* Close stderr so that the qemu-nbd process exits. */ 314c1f8fdc3SPaolo Bonzini dup2(STDOUT_FILENO, STDERR_FILENO); 315c1f8fdc3SPaolo Bonzini } 316a517e88bSPaolo Bonzini 317a517e88bSPaolo Bonzini ret = nbd_client(fd); 318a517e88bSPaolo Bonzini if (ret) { 3190c544d73SPaolo Bonzini goto out_fd; 320a517e88bSPaolo Bonzini } 321a517e88bSPaolo Bonzini close(fd); 322a517e88bSPaolo Bonzini kill(getpid(), SIGTERM); 323a517e88bSPaolo Bonzini return (void *) EXIT_SUCCESS; 324a517e88bSPaolo Bonzini 3250c544d73SPaolo Bonzini out_fd: 3260c544d73SPaolo Bonzini close(fd); 3270c544d73SPaolo Bonzini out_socket: 3280c544d73SPaolo Bonzini closesocket(sock); 329a517e88bSPaolo Bonzini out: 330a517e88bSPaolo Bonzini kill(getpid(), SIGTERM); 331a517e88bSPaolo Bonzini return (void *) EXIT_FAILURE; 332cd831bd7Sths } 333cd831bd7Sths 334a61c6782SPaolo Bonzini static int nbd_can_accept(void *opaque) 335a61c6782SPaolo Bonzini { 336a61c6782SPaolo Bonzini return nb_fds < shared; 337a61c6782SPaolo Bonzini } 338a61c6782SPaolo Bonzini 3397860a380SPaolo Bonzini static void nbd_export_closed(NBDExport *exp) 3407860a380SPaolo Bonzini { 3417860a380SPaolo Bonzini assert(state == TERMINATING); 3427860a380SPaolo Bonzini state = TERMINATED; 3437860a380SPaolo Bonzini } 3447860a380SPaolo Bonzini 3451743b515SPaolo Bonzini static void nbd_client_closed(NBDClient *client) 346a61c6782SPaolo Bonzini { 347a61c6782SPaolo Bonzini nb_fds--; 3487860a380SPaolo Bonzini if (nb_fds == 0 && !persistent && state == RUNNING) { 3497860a380SPaolo Bonzini state = TERMINATE; 3507860a380SPaolo Bonzini } 3511743b515SPaolo Bonzini qemu_notify_event(); 3527860a380SPaolo Bonzini nbd_client_put(client); 353a61c6782SPaolo Bonzini } 354a61c6782SPaolo Bonzini 355a61c6782SPaolo Bonzini static void nbd_accept(void *opaque) 356a61c6782SPaolo Bonzini { 357a61c6782SPaolo Bonzini int server_fd = (uintptr_t) opaque; 358a61c6782SPaolo Bonzini struct sockaddr_in addr; 359a61c6782SPaolo Bonzini socklen_t addr_len = sizeof(addr); 360a61c6782SPaolo Bonzini 361a61c6782SPaolo Bonzini int fd = accept(server_fd, (struct sockaddr *)&addr, &addr_len); 3620c544d73SPaolo Bonzini if (fd < 0) { 3630c544d73SPaolo Bonzini perror("accept"); 3640c544d73SPaolo Bonzini return; 3650c544d73SPaolo Bonzini } 3660c544d73SPaolo Bonzini 3677860a380SPaolo Bonzini if (state >= TERMINATE) { 3687860a380SPaolo Bonzini close(fd); 3697860a380SPaolo Bonzini return; 3707860a380SPaolo Bonzini } 3717860a380SPaolo Bonzini 37236af5994SHani Benhabiles if (nbd_client_new(exp, fd, nbd_client_closed)) { 373a61c6782SPaolo Bonzini nb_fds++; 37436af5994SHani Benhabiles } else { 375*27e5eae4SHani Benhabiles shutdown(fd, 2); 37636af5994SHani Benhabiles close(fd); 377a61c6782SPaolo Bonzini } 378a61c6782SPaolo Bonzini } 379a61c6782SPaolo Bonzini 3807a5ca864Sbellard int main(int argc, char **argv) 3817a5ca864Sbellard { 3827a5ca864Sbellard BlockDriverState *bs; 383e6b63677SDaniel P. Berrange BlockDriver *drv; 3847a5ca864Sbellard off_t dev_offset = 0; 385b90fb4b8SPaolo Bonzini uint32_t nbdflags = 0; 386cd831bd7Sths bool disconnect = false; 3877a5ca864Sbellard const char *bindto = "0.0.0.0"; 388a6ac2313SPaolo Bonzini char *device = NULL; 389c2e2872bSLaurent Vivier int port = NBD_DEFAULT_PORT; 3907a5ca864Sbellard off_t fd_size; 3918c116b0eSWenchao Xia QemuOpts *sn_opts = NULL; 3928c116b0eSWenchao Xia const char *sn_id_or_name = NULL; 3938c116b0eSWenchao Xia const char *sopt = "hVb:o:p:rsnP:c:dvk:e:f:tl:"; 3947a5ca864Sbellard struct option lopt[] = { 395660f11beSBlue Swirl { "help", 0, NULL, 'h' }, 396660f11beSBlue Swirl { "version", 0, NULL, 'V' }, 397660f11beSBlue Swirl { "bind", 1, NULL, 'b' }, 398660f11beSBlue Swirl { "port", 1, NULL, 'p' }, 399660f11beSBlue Swirl { "socket", 1, NULL, 'k' }, 400660f11beSBlue Swirl { "offset", 1, NULL, 'o' }, 401660f11beSBlue Swirl { "read-only", 0, NULL, 'r' }, 402660f11beSBlue Swirl { "partition", 1, NULL, 'P' }, 403660f11beSBlue Swirl { "connect", 1, NULL, 'c' }, 404660f11beSBlue Swirl { "disconnect", 0, NULL, 'd' }, 405660f11beSBlue Swirl { "snapshot", 0, NULL, 's' }, 4068c116b0eSWenchao Xia { "load-snapshot", 1, NULL, 'l' }, 407660f11beSBlue Swirl { "nocache", 0, NULL, 'n' }, 40839a5235cSPaolo Bonzini { "cache", 1, NULL, QEMU_NBD_OPT_CACHE }, 40939a5235cSPaolo Bonzini #ifdef CONFIG_LINUX_AIO 41039a5235cSPaolo Bonzini { "aio", 1, NULL, QEMU_NBD_OPT_AIO }, 41139a5235cSPaolo Bonzini #endif 412ded9d2d5SPaolo Bonzini { "discard", 1, NULL, QEMU_NBD_OPT_DISCARD }, 413660f11beSBlue Swirl { "shared", 1, NULL, 'e' }, 414e6b63677SDaniel P. Berrange { "format", 1, NULL, 'f' }, 415660f11beSBlue Swirl { "persistent", 0, NULL, 't' }, 416660f11beSBlue Swirl { "verbose", 0, NULL, 'v' }, 417660f11beSBlue Swirl { NULL, 0, NULL, 0 } 4187a5ca864Sbellard }; 4197a5ca864Sbellard int ch; 4207a5ca864Sbellard int opt_ind = 0; 4217a5ca864Sbellard int li; 4227a5ca864Sbellard char *end; 423f5edb014SNaphtali Sprei int flags = BDRV_O_RDWR; 4247a5ca864Sbellard int partition = -1; 425cd831bd7Sths int ret; 4263b05a8e9Sths int fd; 42739a5235cSPaolo Bonzini bool seen_cache = false; 428ded9d2d5SPaolo Bonzini bool seen_discard = false; 42939a5235cSPaolo Bonzini #ifdef CONFIG_LINUX_AIO 43039a5235cSPaolo Bonzini bool seen_aio = false; 43139a5235cSPaolo Bonzini #endif 432a517e88bSPaolo Bonzini pthread_t client_thread; 433e6b63677SDaniel P. Berrange const char *fmt = NULL; 43434b5d2c6SMax Reitz Error *local_err = NULL; 4357a5ca864Sbellard 436a517e88bSPaolo Bonzini /* The client thread uses SIGTERM to interrupt the server. A signal 437a517e88bSPaolo Bonzini * handler ensures that "qemu-nbd -v -c" exits with a nice status code. 438a517e88bSPaolo Bonzini */ 439bb345110SPaolo Bonzini struct sigaction sa_sigterm; 440bb345110SPaolo Bonzini memset(&sa_sigterm, 0, sizeof(sa_sigterm)); 441bb345110SPaolo Bonzini sa_sigterm.sa_handler = termsig_handler; 442bb345110SPaolo Bonzini sigaction(SIGTERM, &sa_sigterm, NULL); 44310f5bff6SFam Zheng qemu_init_exec_dir(argv[0]); 444bb345110SPaolo Bonzini 4457a5ca864Sbellard while ((ch = getopt_long(argc, argv, sopt, lopt, &opt_ind)) != -1) { 4467a5ca864Sbellard switch (ch) { 4477a5ca864Sbellard case 's': 4482f726488Sths flags |= BDRV_O_SNAPSHOT; 4492f726488Sths break; 4502f726488Sths case 'n': 45139a5235cSPaolo Bonzini optarg = (char *) "none"; 45239a5235cSPaolo Bonzini /* fallthrough */ 45339a5235cSPaolo Bonzini case QEMU_NBD_OPT_CACHE: 45439a5235cSPaolo Bonzini if (seen_cache) { 45539a5235cSPaolo Bonzini errx(EXIT_FAILURE, "-n and --cache can only be specified once"); 45639a5235cSPaolo Bonzini } 45739a5235cSPaolo Bonzini seen_cache = true; 45839a5235cSPaolo Bonzini if (bdrv_parse_cache_flags(optarg, &flags) == -1) { 45939a5235cSPaolo Bonzini errx(EXIT_FAILURE, "Invalid cache mode `%s'", optarg); 46039a5235cSPaolo Bonzini } 4617a5ca864Sbellard break; 46239a5235cSPaolo Bonzini #ifdef CONFIG_LINUX_AIO 46339a5235cSPaolo Bonzini case QEMU_NBD_OPT_AIO: 46439a5235cSPaolo Bonzini if (seen_aio) { 46539a5235cSPaolo Bonzini errx(EXIT_FAILURE, "--aio can only be specified once"); 46639a5235cSPaolo Bonzini } 46739a5235cSPaolo Bonzini seen_aio = true; 46839a5235cSPaolo Bonzini if (!strcmp(optarg, "native")) { 46939a5235cSPaolo Bonzini flags |= BDRV_O_NATIVE_AIO; 47039a5235cSPaolo Bonzini } else if (!strcmp(optarg, "threads")) { 47139a5235cSPaolo Bonzini /* this is the default */ 47239a5235cSPaolo Bonzini } else { 47339a5235cSPaolo Bonzini errx(EXIT_FAILURE, "invalid aio mode `%s'", optarg); 47439a5235cSPaolo Bonzini } 47539a5235cSPaolo Bonzini break; 47639a5235cSPaolo Bonzini #endif 477ded9d2d5SPaolo Bonzini case QEMU_NBD_OPT_DISCARD: 478ded9d2d5SPaolo Bonzini if (seen_discard) { 479ded9d2d5SPaolo Bonzini errx(EXIT_FAILURE, "--discard can only be specified once"); 480ded9d2d5SPaolo Bonzini } 481ded9d2d5SPaolo Bonzini seen_discard = true; 482ded9d2d5SPaolo Bonzini if (bdrv_parse_discard_flags(optarg, &flags) == -1) { 483ded9d2d5SPaolo Bonzini errx(EXIT_FAILURE, "Invalid discard mode `%s'", optarg); 484ded9d2d5SPaolo Bonzini } 485ded9d2d5SPaolo Bonzini break; 4867a5ca864Sbellard case 'b': 4877a5ca864Sbellard bindto = optarg; 4887a5ca864Sbellard break; 4897a5ca864Sbellard case 'p': 4907a5ca864Sbellard li = strtol(optarg, &end, 0); 4917a5ca864Sbellard if (*end) { 492b6353beaSRyota Ozaki errx(EXIT_FAILURE, "Invalid port `%s'", optarg); 4937a5ca864Sbellard } 4947a5ca864Sbellard if (li < 1 || li > 65535) { 495b6353beaSRyota Ozaki errx(EXIT_FAILURE, "Port out of range `%s'", optarg); 4967a5ca864Sbellard } 4977a5ca864Sbellard port = (uint16_t)li; 4987a5ca864Sbellard break; 4997a5ca864Sbellard case 'o': 5007a5ca864Sbellard dev_offset = strtoll (optarg, &end, 0); 5017a5ca864Sbellard if (*end) { 502b6353beaSRyota Ozaki errx(EXIT_FAILURE, "Invalid offset `%s'", optarg); 5037a5ca864Sbellard } 5047a5ca864Sbellard if (dev_offset < 0) { 505b6353beaSRyota Ozaki errx(EXIT_FAILURE, "Offset must be positive `%s'", optarg); 5067a5ca864Sbellard } 5077a5ca864Sbellard break; 5088c116b0eSWenchao Xia case 'l': 5098c116b0eSWenchao Xia if (strstart(optarg, SNAPSHOT_OPT_BASE, NULL)) { 5108c116b0eSWenchao Xia sn_opts = qemu_opts_parse(&internal_snapshot_opts, optarg, 0); 5118c116b0eSWenchao Xia if (!sn_opts) { 5128c116b0eSWenchao Xia errx(EXIT_FAILURE, "Failed in parsing snapshot param `%s'", 5138c116b0eSWenchao Xia optarg); 5148c116b0eSWenchao Xia } 5158c116b0eSWenchao Xia } else { 5168c116b0eSWenchao Xia sn_id_or_name = optarg; 5178c116b0eSWenchao Xia } 5188c116b0eSWenchao Xia /* fall through */ 5197a5ca864Sbellard case 'r': 520b90fb4b8SPaolo Bonzini nbdflags |= NBD_FLAG_READ_ONLY; 52107108b29SNaphtali Sprei flags &= ~BDRV_O_RDWR; 5227a5ca864Sbellard break; 5237a5ca864Sbellard case 'P': 5247a5ca864Sbellard partition = strtol(optarg, &end, 0); 5257a5ca864Sbellard if (*end) 526b6353beaSRyota Ozaki errx(EXIT_FAILURE, "Invalid partition `%s'", optarg); 5277a5ca864Sbellard if (partition < 1 || partition > 8) 528b6353beaSRyota Ozaki errx(EXIT_FAILURE, "Invalid partition %d", partition); 5297a5ca864Sbellard break; 530cd831bd7Sths case 'k': 531b32f6c28SPaolo Bonzini sockpath = optarg; 532b32f6c28SPaolo Bonzini if (sockpath[0] != '/') 533b6353beaSRyota Ozaki errx(EXIT_FAILURE, "socket path must be absolute\n"); 534cd831bd7Sths break; 535cd831bd7Sths case 'd': 536cd831bd7Sths disconnect = true; 537cd831bd7Sths break; 538cd831bd7Sths case 'c': 539cd831bd7Sths device = optarg; 540cd831bd7Sths break; 5413b05a8e9Sths case 'e': 5423b05a8e9Sths shared = strtol(optarg, &end, 0); 5433b05a8e9Sths if (*end) { 544b6353beaSRyota Ozaki errx(EXIT_FAILURE, "Invalid shared device number '%s'", optarg); 5453b05a8e9Sths } 5463b05a8e9Sths if (shared < 1) { 547b6353beaSRyota Ozaki errx(EXIT_FAILURE, "Shared device number must be greater than 0\n"); 5483b05a8e9Sths } 5493b05a8e9Sths break; 550e6b63677SDaniel P. Berrange case 'f': 551e6b63677SDaniel P. Berrange fmt = optarg; 552e6b63677SDaniel P. Berrange break; 55375818250Sths case 't': 55475818250Sths persistent = 1; 55575818250Sths break; 5567a5ca864Sbellard case 'v': 5577a5ca864Sbellard verbose = 1; 5587a5ca864Sbellard break; 5597a5ca864Sbellard case 'V': 5607a5ca864Sbellard version(argv[0]); 5617a5ca864Sbellard exit(0); 5627a5ca864Sbellard break; 5637a5ca864Sbellard case 'h': 5647a5ca864Sbellard usage(argv[0]); 5657a5ca864Sbellard exit(0); 5667a5ca864Sbellard break; 5677a5ca864Sbellard case '?': 568b6353beaSRyota Ozaki errx(EXIT_FAILURE, "Try `%s --help' for more information.", 5697a5ca864Sbellard argv[0]); 5707a5ca864Sbellard } 5717a5ca864Sbellard } 5727a5ca864Sbellard 5737a5ca864Sbellard if ((argc - optind) != 1) { 574b6353beaSRyota Ozaki errx(EXIT_FAILURE, "Invalid number of argument.\n" 5757a5ca864Sbellard "Try `%s --help' for more information.", 5767a5ca864Sbellard argv[0]); 5777a5ca864Sbellard } 5787a5ca864Sbellard 579cd831bd7Sths if (disconnect) { 580cd831bd7Sths fd = open(argv[optind], O_RDWR); 581fc19f8a0SPaolo Bonzini if (fd < 0) { 582cb7cf0e3SRyota Ozaki err(EXIT_FAILURE, "Cannot open %s", argv[optind]); 583fc19f8a0SPaolo Bonzini } 584cd831bd7Sths nbd_disconnect(fd); 585cd831bd7Sths 586cd831bd7Sths close(fd); 587cd831bd7Sths 588cd831bd7Sths printf("%s disconnected\n", argv[optind]); 589cd831bd7Sths 590cd831bd7Sths return 0; 591cd831bd7Sths } 592cd831bd7Sths 593c1f8fdc3SPaolo Bonzini if (device && !verbose) { 594c1f8fdc3SPaolo Bonzini int stderr_fd[2]; 595c1f8fdc3SPaolo Bonzini pid_t pid; 596c1f8fdc3SPaolo Bonzini int ret; 597c1f8fdc3SPaolo Bonzini 598fc19f8a0SPaolo Bonzini if (qemu_pipe(stderr_fd) < 0) { 599c1f8fdc3SPaolo Bonzini err(EXIT_FAILURE, "Error setting up communication pipe"); 600c1f8fdc3SPaolo Bonzini } 601c1f8fdc3SPaolo Bonzini 602c1f8fdc3SPaolo Bonzini /* Now daemonize, but keep a communication channel open to 603c1f8fdc3SPaolo Bonzini * print errors and exit with the proper status code. 604c1f8fdc3SPaolo Bonzini */ 605c1f8fdc3SPaolo Bonzini pid = fork(); 606c1f8fdc3SPaolo Bonzini if (pid == 0) { 607c1f8fdc3SPaolo Bonzini close(stderr_fd[0]); 6089faf31b6SMichael Tokarev ret = qemu_daemon(1, 0); 609c1f8fdc3SPaolo Bonzini 610c1f8fdc3SPaolo Bonzini /* Temporarily redirect stderr to the parent's pipe... */ 611c1f8fdc3SPaolo Bonzini dup2(stderr_fd[1], STDERR_FILENO); 612fc19f8a0SPaolo Bonzini if (ret < 0) { 613c1f8fdc3SPaolo Bonzini err(EXIT_FAILURE, "Failed to daemonize"); 614c1f8fdc3SPaolo Bonzini } 615c1f8fdc3SPaolo Bonzini 616c1f8fdc3SPaolo Bonzini /* ... close the descriptor we inherited and go on. */ 617c1f8fdc3SPaolo Bonzini close(stderr_fd[1]); 618c1f8fdc3SPaolo Bonzini } else { 619c1f8fdc3SPaolo Bonzini bool errors = false; 620c1f8fdc3SPaolo Bonzini char *buf; 621c1f8fdc3SPaolo Bonzini 622c1f8fdc3SPaolo Bonzini /* In the parent. Print error messages from the child until 623c1f8fdc3SPaolo Bonzini * it closes the pipe. 624c1f8fdc3SPaolo Bonzini */ 625c1f8fdc3SPaolo Bonzini close(stderr_fd[1]); 626c1f8fdc3SPaolo Bonzini buf = g_malloc(1024); 627c1f8fdc3SPaolo Bonzini while ((ret = read(stderr_fd[0], buf, 1024)) > 0) { 628c1f8fdc3SPaolo Bonzini errors = true; 629c1f8fdc3SPaolo Bonzini ret = qemu_write_full(STDERR_FILENO, buf, ret); 630fc19f8a0SPaolo Bonzini if (ret < 0) { 631c1f8fdc3SPaolo Bonzini exit(EXIT_FAILURE); 632c1f8fdc3SPaolo Bonzini } 633c1f8fdc3SPaolo Bonzini } 634fc19f8a0SPaolo Bonzini if (ret < 0) { 635c1f8fdc3SPaolo Bonzini err(EXIT_FAILURE, "Cannot read from daemon"); 636c1f8fdc3SPaolo Bonzini } 637c1f8fdc3SPaolo Bonzini 638c1f8fdc3SPaolo Bonzini /* Usually the daemon should not print any message. 639c1f8fdc3SPaolo Bonzini * Exit with zero status in that case. 640c1f8fdc3SPaolo Bonzini */ 641c1f8fdc3SPaolo Bonzini exit(errors); 642c1f8fdc3SPaolo Bonzini } 643c1f8fdc3SPaolo Bonzini } 644c1f8fdc3SPaolo Bonzini 645a6ac2313SPaolo Bonzini if (device != NULL && sockpath == NULL) { 646b32f6c28SPaolo Bonzini sockpath = g_malloc(128); 647b32f6c28SPaolo Bonzini snprintf(sockpath, 128, SOCKET_PATH, basename(device)); 648cd831bd7Sths } 649cd831bd7Sths 6507e7f4a0eSPaolo Bonzini qemu_init_main_loop(); 651802ddc37SPaolo Bonzini bdrv_init(); 652802ddc37SPaolo Bonzini atexit(bdrv_close_all); 653802ddc37SPaolo Bonzini 654e6b63677SDaniel P. Berrange if (fmt) { 655e6b63677SDaniel P. Berrange drv = bdrv_find_format(fmt); 656e6b63677SDaniel P. Berrange if (!drv) { 657e6b63677SDaniel P. Berrange errx(EXIT_FAILURE, "Unknown file format '%s'", fmt); 658e6b63677SDaniel P. Berrange } 659e6b63677SDaniel P. Berrange } else { 660e6b63677SDaniel P. Berrange drv = NULL; 661e6b63677SDaniel P. Berrange } 662e6b63677SDaniel P. Berrange 66398522f63SKevin Wolf bs = bdrv_new("hda", &error_abort); 66498522f63SKevin Wolf 665802ddc37SPaolo Bonzini srcpath = argv[optind]; 666ddf5636dSMax Reitz ret = bdrv_open(&bs, srcpath, NULL, NULL, flags, drv, &local_err); 667e6b63677SDaniel P. Berrange if (ret < 0) { 668802ddc37SPaolo Bonzini errno = -ret; 66934b5d2c6SMax Reitz err(EXIT_FAILURE, "Failed to bdrv_open '%s': %s", argv[optind], 67034b5d2c6SMax Reitz error_get_pretty(local_err)); 671802ddc37SPaolo Bonzini } 672802ddc37SPaolo Bonzini 6738c116b0eSWenchao Xia if (sn_opts) { 6748c116b0eSWenchao Xia ret = bdrv_snapshot_load_tmp(bs, 6758c116b0eSWenchao Xia qemu_opt_get(sn_opts, SNAPSHOT_OPT_ID), 6768c116b0eSWenchao Xia qemu_opt_get(sn_opts, SNAPSHOT_OPT_NAME), 6778c116b0eSWenchao Xia &local_err); 6788c116b0eSWenchao Xia } else if (sn_id_or_name) { 6798c116b0eSWenchao Xia ret = bdrv_snapshot_load_tmp_by_id_or_name(bs, sn_id_or_name, 6808c116b0eSWenchao Xia &local_err); 6818c116b0eSWenchao Xia } 6828c116b0eSWenchao Xia if (ret < 0) { 6838c116b0eSWenchao Xia errno = -ret; 6848c116b0eSWenchao Xia err(EXIT_FAILURE, 6858c116b0eSWenchao Xia "Failed to load snapshot: %s", 6868c116b0eSWenchao Xia error_get_pretty(local_err)); 6878c116b0eSWenchao Xia } 6888c116b0eSWenchao Xia 68938ceff04SPaolo Bonzini fd_size = bdrv_getlength(bs); 690802ddc37SPaolo Bonzini 691185b4338SPaolo Bonzini if (partition != -1) { 692185b4338SPaolo Bonzini ret = find_partition(bs, partition, &dev_offset, &fd_size); 693185b4338SPaolo Bonzini if (ret < 0) { 694185b4338SPaolo Bonzini errno = -ret; 695802ddc37SPaolo Bonzini err(EXIT_FAILURE, "Could not find partition %d", partition); 696802ddc37SPaolo Bonzini } 697185b4338SPaolo Bonzini } 698802ddc37SPaolo Bonzini 6997860a380SPaolo Bonzini exp = nbd_export_new(bs, dev_offset, fd_size, nbdflags, nbd_export_closed); 7003b05a8e9Sths 701b32f6c28SPaolo Bonzini if (sockpath) { 702a61c6782SPaolo Bonzini fd = unix_socket_incoming(sockpath); 703cd831bd7Sths } else { 704a61c6782SPaolo Bonzini fd = tcp_socket_incoming(bindto, port); 705cd831bd7Sths } 706cd831bd7Sths 707fc19f8a0SPaolo Bonzini if (fd < 0) { 7087a5ca864Sbellard return 1; 709a61c6782SPaolo Bonzini } 710f1ef5555SPaolo Bonzini 711f1ef5555SPaolo Bonzini if (device) { 712f1ef5555SPaolo Bonzini int ret; 713f1ef5555SPaolo Bonzini 714a6ac2313SPaolo Bonzini ret = pthread_create(&client_thread, NULL, nbd_client_thread, device); 715f1ef5555SPaolo Bonzini if (ret != 0) { 716f1ef5555SPaolo Bonzini errx(EXIT_FAILURE, "Failed to create client thread: %s", 717f1ef5555SPaolo Bonzini strerror(ret)); 718f1ef5555SPaolo Bonzini } 719f1ef5555SPaolo Bonzini } else { 720f1ef5555SPaolo Bonzini /* Shut up GCC warnings. */ 721f1ef5555SPaolo Bonzini memset(&client_thread, 0, sizeof(client_thread)); 722f1ef5555SPaolo Bonzini } 723f1ef5555SPaolo Bonzini 724a61c6782SPaolo Bonzini qemu_set_fd_handler2(fd, nbd_can_accept, nbd_accept, NULL, 725a61c6782SPaolo Bonzini (void *)(uintptr_t)fd); 7267a5ca864Sbellard 7279faf31b6SMichael Tokarev /* now when the initialization is (almost) complete, chdir("/") 7289faf31b6SMichael Tokarev * to free any busy filesystems */ 7299faf31b6SMichael Tokarev if (chdir("/") < 0) { 7309faf31b6SMichael Tokarev err(EXIT_FAILURE, "Could not chdir to root directory"); 7319faf31b6SMichael Tokarev } 7329faf31b6SMichael Tokarev 7337860a380SPaolo Bonzini state = RUNNING; 7343b05a8e9Sths do { 735a61c6782SPaolo Bonzini main_loop_wait(false); 7367860a380SPaolo Bonzini if (state == TERMINATE) { 7377860a380SPaolo Bonzini state = TERMINATING; 738af49bbbeSPaolo Bonzini nbd_export_close(exp); 7392c8d9f06SPaolo Bonzini nbd_export_put(exp); 7407860a380SPaolo Bonzini exp = NULL; 7417860a380SPaolo Bonzini } 7427860a380SPaolo Bonzini } while (state != TERMINATED); 7432c8d9f06SPaolo Bonzini 7447860a380SPaolo Bonzini bdrv_close(bs); 745b32f6c28SPaolo Bonzini if (sockpath) { 746b32f6c28SPaolo Bonzini unlink(sockpath); 747b32f6c28SPaolo Bonzini } 7487a5ca864Sbellard 7498c116b0eSWenchao Xia if (sn_opts) { 7508c116b0eSWenchao Xia qemu_opts_del(sn_opts); 7518c116b0eSWenchao Xia } 7528c116b0eSWenchao Xia 753a517e88bSPaolo Bonzini if (device) { 754a517e88bSPaolo Bonzini void *ret; 755a517e88bSPaolo Bonzini pthread_join(client_thread, &ret); 756a517e88bSPaolo Bonzini exit(ret != NULL); 757a517e88bSPaolo Bonzini } else { 758a517e88bSPaolo Bonzini exit(EXIT_SUCCESS); 759a517e88bSPaolo Bonzini } 7607a5ca864Sbellard } 761