xref: /kvmtool/builtin-run.c (revision e830cce7780a0d008fd00f6e5daba6dcc5e297d4)
1ece09f8fSPekka Enberg #include "kvm/builtin-run.h"
2ece09f8fSPekka Enberg 
3c8675741SSasha Levin #include "kvm/builtin-setup.h"
4ece09f8fSPekka Enberg #include "kvm/virtio-balloon.h"
5ece09f8fSPekka Enberg #include "kvm/virtio-console.h"
6ece09f8fSPekka Enberg #include "kvm/parse-options.h"
7ece09f8fSPekka Enberg #include "kvm/8250-serial.h"
8ece09f8fSPekka Enberg #include "kvm/framebuffer.h"
9ece09f8fSPekka Enberg #include "kvm/disk-image.h"
10ece09f8fSPekka Enberg #include "kvm/threadpool.h"
11a67da3beSAsias He #include "kvm/virtio-scsi.h"
12ece09f8fSPekka Enberg #include "kvm/virtio-blk.h"
13ece09f8fSPekka Enberg #include "kvm/virtio-net.h"
14ece09f8fSPekka Enberg #include "kvm/virtio-rng.h"
15ece09f8fSPekka Enberg #include "kvm/ioeventfd.h"
16ece09f8fSPekka Enberg #include "kvm/virtio-9p.h"
17ece09f8fSPekka Enberg #include "kvm/barrier.h"
18ece09f8fSPekka Enberg #include "kvm/kvm-cpu.h"
19ece09f8fSPekka Enberg #include "kvm/ioport.h"
20ece09f8fSPekka Enberg #include "kvm/symbol.h"
21ece09f8fSPekka Enberg #include "kvm/i8042.h"
22ece09f8fSPekka Enberg #include "kvm/mutex.h"
23ece09f8fSPekka Enberg #include "kvm/term.h"
24ece09f8fSPekka Enberg #include "kvm/util.h"
25ec52d504SLai Jiangshan #include "kvm/strbuf.h"
26ece09f8fSPekka Enberg #include "kvm/vesa.h"
27ece09f8fSPekka Enberg #include "kvm/irq.h"
28ece09f8fSPekka Enberg #include "kvm/kvm.h"
29ece09f8fSPekka Enberg #include "kvm/pci.h"
30ece09f8fSPekka Enberg #include "kvm/rtc.h"
31ece09f8fSPekka Enberg #include "kvm/sdl.h"
32ece09f8fSPekka Enberg #include "kvm/vnc.h"
33e6694207SSasha Levin #include "kvm/guest_compat.h"
3495d13a52SSasha Levin #include "kvm/pci-shmem.h"
354b1addaeSSasha Levin #include "kvm/kvm-ipc.h"
364b1c6f6eSSasha Levin #include "kvm/builtin-debug.h"
37ece09f8fSPekka Enberg 
38ece09f8fSPekka Enberg #include <linux/types.h>
3948d9e01aSSasha Levin #include <linux/err.h>
40ece09f8fSPekka Enberg 
418329f30bSPekka Enberg #include <sys/utsname.h>
428329f30bSPekka Enberg #include <sys/types.h>
438329f30bSPekka Enberg #include <sys/stat.h>
44ece09f8fSPekka Enberg #include <termios.h>
45ece09f8fSPekka Enberg #include <signal.h>
46ece09f8fSPekka Enberg #include <stdlib.h>
47ece09f8fSPekka Enberg #include <string.h>
48ece09f8fSPekka Enberg #include <unistd.h>
4926c853e4SPrasad Joshi #include <ctype.h>
50ece09f8fSPekka Enberg #include <stdio.h>
51f967c427SPrasad Joshi 
/* Shift counts used to scale a value by KiB, MiB or GiB. */
#define KB_SHIFT		(10)
#define MB_SHIFT		(20)
#define GB_SHIFT		(30)

/* The VM instance every parser and handler in this file operates on. */
struct kvm *kvm;
/* Array of vCPU pointers, indexed by vCPU number. */
struct kvm_cpu **kvm_cpus;
/* Per-thread pointer to the vCPU owned by the calling thread. */
__thread struct kvm_cpu *current_kvm_cpu;

/* Holds one of the KVM_RUN_* values declared below. */
static int  kvm_run_wrapper;
/* Defined in other translation units. */
extern int  active_console;
extern int  debug_iodelay;

/* Storage behind the "--debug" option. */
bool do_debug_print = false;

/* Storage behind the "--cpus" and "--vidmode" options. */
static int nrcpus;
static int vidmode = -1;

/*
 * presumably symbols describing an embedded guest init binary that are
 * provided at link time -- TODO confirm against the build rules.
 */
extern char _binary_guest_init_start;
extern char _binary_guest_init_size;

/* Usage synopsis, NULL-terminated. */
static const char * const run_usage[] = {
	"lkvm run [<options>] [<kernel image>]",
	NULL
};

/* Values stored in kvm_run_wrapper. */
enum {
	KVM_RUN_DEFAULT,
	KVM_RUN_SANDBOX,
};
813c29e2aaSSasha Levin 
823c29e2aaSSasha Levin void kvm_run_set_wrapper_sandbox(void)
833c29e2aaSSasha Levin {
843c29e2aaSSasha Levin 	kvm_run_wrapper = KVM_RUN_SANDBOX;
853c29e2aaSSasha Levin }
863c29e2aaSSasha Levin 
87a33979d8SSasha Levin static int img_name_parser(const struct option *opt, const char *arg, int unset)
88a33979d8SSasha Levin {
8982d65b5eSSasha Levin 	char path[PATH_MAX];
905236b505SAsias He 	const char *cur;
915236b505SAsias He 	struct stat st;
925236b505SAsias He 	char *sep;
9359aa2d30SSasha Levin 
9459aa2d30SSasha Levin 	if (stat(arg, &st) == 0 &&
9559aa2d30SSasha Levin 	    S_ISDIR(st.st_mode)) {
9659aa2d30SSasha Levin 		char tmp[PATH_MAX];
9759aa2d30SSasha Levin 
9847621338SSasha Levin 		if (kvm->cfg.using_rootfs)
992c908af9SLai Jiangshan 			die("Please use only one rootfs directory atmost");
1002c908af9SLai Jiangshan 
10159aa2d30SSasha Levin 		if (realpath(arg, tmp) == 0 ||
102c7838fbdSSasha Levin 		    virtio_9p__register(kvm, tmp, "/dev/root") < 0)
10359aa2d30SSasha Levin 			die("Unable to initialize virtio 9p");
10447621338SSasha Levin 		kvm->cfg.using_rootfs = 1;
10559aa2d30SSasha Levin 		return 0;
10659aa2d30SSasha Levin 	}
107a33979d8SSasha Levin 
1089667701cSPekka Enberg 	snprintf(path, PATH_MAX, "%s%s", kvm__get_dir(), arg);
10982d65b5eSSasha Levin 
11082d65b5eSSasha Levin 	if (stat(path, &st) == 0 &&
11182d65b5eSSasha Levin 	    S_ISDIR(st.st_mode)) {
11282d65b5eSSasha Levin 		char tmp[PATH_MAX];
11382d65b5eSSasha Levin 
11447621338SSasha Levin 		if (kvm->cfg.using_rootfs)
1152c908af9SLai Jiangshan 			die("Please use only one rootfs directory atmost");
1162c908af9SLai Jiangshan 
11782d65b5eSSasha Levin 		if (realpath(path, tmp) == 0 ||
11882d65b5eSSasha Levin 		    virtio_9p__register(kvm, tmp, "/dev/root") < 0)
11982d65b5eSSasha Levin 			die("Unable to initialize virtio 9p");
12082d65b5eSSasha Levin 		if (virtio_9p__register(kvm, "/", "hostfs") < 0)
12182d65b5eSSasha Levin 			die("Unable to initialize virtio 9p");
12269c88b95SSasha Levin 		kvm_setup_resolv(arg);
12347621338SSasha Levin 		kvm->cfg.using_rootfs = kvm->cfg.custom_rootfs = 1;
12447621338SSasha Levin 		kvm->cfg.custom_rootfs_name = arg;
12582d65b5eSSasha Levin 		return 0;
12682d65b5eSSasha Levin 	}
12782d65b5eSSasha Levin 
12847621338SSasha Levin 	if (kvm->cfg.image_count >= MAX_DISK_IMAGES)
129a33979d8SSasha Levin 		die("Currently only 4 images are supported");
130a33979d8SSasha Levin 
13147621338SSasha Levin 	kvm->cfg.disk_image[kvm->cfg.image_count].filename = arg;
1325236b505SAsias He 	cur = arg;
133a67da3beSAsias He 
134a67da3beSAsias He 	if (strncmp(arg, "scsi:", 5) == 0) {
135a67da3beSAsias He 		sep = strstr(arg, ":");
136a67da3beSAsias He 		if (sep)
13747621338SSasha Levin 			kvm->cfg.disk_image[kvm->cfg.image_count].wwpn = sep + 1;
138a67da3beSAsias He 		sep = strstr(sep + 1, ":");
139a67da3beSAsias He 		if (sep) {
140a67da3beSAsias He 			*sep = 0;
14147621338SSasha Levin 			kvm->cfg.disk_image[kvm->cfg.image_count].tpgt = sep + 1;
142a67da3beSAsias He 		}
143a67da3beSAsias He 		cur = sep + 1;
144a67da3beSAsias He 	}
145a67da3beSAsias He 
1465236b505SAsias He 	do {
1475236b505SAsias He 		sep = strstr(cur, ",");
148a33979d8SSasha Levin 		if (sep) {
1495236b505SAsias He 			if (strncmp(sep + 1, "ro", 2) == 0)
15047621338SSasha Levin 				kvm->cfg.disk_image[kvm->cfg.image_count].readonly = true;
1515236b505SAsias He 			else if (strncmp(sep + 1, "direct", 6) == 0)
15247621338SSasha Levin 				kvm->cfg.disk_image[kvm->cfg.image_count].direct = true;
153a33979d8SSasha Levin 			*sep = 0;
1545236b505SAsias He 			cur = sep + 1;
155a33979d8SSasha Levin 		}
1565236b505SAsias He 	} while (sep);
157a33979d8SSasha Levin 
15847621338SSasha Levin 	kvm->cfg.image_count++;
159a33979d8SSasha Levin 
160a33979d8SSasha Levin 	return 0;
161a33979d8SSasha Levin }
162a33979d8SSasha Levin 
163b4422bf3SAneesh Kumar K.V static int virtio_9p_rootdir_parser(const struct option *opt, const char *arg, int unset)
164b4422bf3SAneesh Kumar K.V {
165b4422bf3SAneesh Kumar K.V 	char *tag_name;
166b4422bf3SAneesh Kumar K.V 	char tmp[PATH_MAX];
167b4422bf3SAneesh Kumar K.V 
168b4422bf3SAneesh Kumar K.V 	/*
169b4422bf3SAneesh Kumar K.V 	 * 9p dir can be of the form dirname,tag_name or
170b4422bf3SAneesh Kumar K.V 	 * just dirname. In the later case we use the
171b4422bf3SAneesh Kumar K.V 	 * default tag name
172b4422bf3SAneesh Kumar K.V 	 */
173b4422bf3SAneesh Kumar K.V 	tag_name = strstr(arg, ",");
174b4422bf3SAneesh Kumar K.V 	if (tag_name) {
175b4422bf3SAneesh Kumar K.V 		*tag_name = '\0';
176b4422bf3SAneesh Kumar K.V 		tag_name++;
177b4422bf3SAneesh Kumar K.V 	}
17854f6802dSPekka Enberg 	if (realpath(arg, tmp)) {
179c7838fbdSSasha Levin 		if (virtio_9p__register(kvm, tmp, tag_name) < 0)
18054f6802dSPekka Enberg 			die("Unable to initialize virtio 9p");
18154f6802dSPekka Enberg 	} else
182b4422bf3SAneesh Kumar K.V 		die("Failed resolving 9p path");
183b4422bf3SAneesh Kumar K.V 	return 0;
184b4422bf3SAneesh Kumar K.V }
185b4422bf3SAneesh Kumar K.V 
/*
 * Option callback for "--tty": convert @arg with atoi() and hand the result
 * to term_set_tty(). Always returns 0.
 */
static int tty_parser(const struct option *opt, const char *arg, int unset)
{
	term_set_tty(atoi(arg));

	return 0;
}
1941add4b76SSasha Levin 
/*
 * Parse a MAC address written as six colon-separated hex octets
 * ("aa:bb:cc:dd:ee:ff") from @str into the six bytes at @mac.
 *
 * The update is all-or-nothing: when @str does not yield six octets, @mac is
 * left exactly as it was instead of being partially overwritten.
 */
static inline void str_to_mac(const char *str, char *mac)
{
	/* %hhx requires unsigned char storage, so parse into a scratch array. */
	unsigned char octets[6];

	if (sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
		   &octets[0], &octets[1], &octets[2],
		   &octets[3], &octets[4], &octets[5]) != 6)
		return;

	memcpy(mac, octets, sizeof(octets));
}
2009a6d73f1SSasha Levin static int set_net_param(struct virtio_net_params *p, const char *param,
2019a6d73f1SSasha Levin 				const char *val)
2029a6d73f1SSasha Levin {
2039a6d73f1SSasha Levin 	if (strcmp(param, "guest_mac") == 0) {
2049a6d73f1SSasha Levin 		str_to_mac(val, p->guest_mac);
2059a6d73f1SSasha Levin 	} else if (strcmp(param, "mode") == 0) {
2069a6d73f1SSasha Levin 		if (!strncmp(val, "user", 4)) {
2079a6d73f1SSasha Levin 			int i;
2089a6d73f1SSasha Levin 
20947621338SSasha Levin 			for (i = 0; i < kvm->cfg.num_net_devices; i++)
21047621338SSasha Levin 				if (kvm->cfg.net_params[i].mode == NET_MODE_USER)
2119a6d73f1SSasha Levin 					die("Only one usermode network device allowed at a time");
2129a6d73f1SSasha Levin 			p->mode = NET_MODE_USER;
2139a6d73f1SSasha Levin 		} else if (!strncmp(val, "tap", 3)) {
2149a6d73f1SSasha Levin 			p->mode = NET_MODE_TAP;
2159a6d73f1SSasha Levin 		} else if (!strncmp(val, "none", 4)) {
21647621338SSasha Levin 			kvm->cfg.no_net = 1;
2179a6d73f1SSasha Levin 			return -1;
2189a6d73f1SSasha Levin 		} else
21947621338SSasha Levin 			die("Unknown network mode %s, please use user, tap or none", kvm->cfg.network);
2209a6d73f1SSasha Levin 	} else if (strcmp(param, "script") == 0) {
2219a6d73f1SSasha Levin 		p->script = strdup(val);
2229a6d73f1SSasha Levin 	} else if (strcmp(param, "guest_ip") == 0) {
2239a6d73f1SSasha Levin 		p->guest_ip = strdup(val);
2249a6d73f1SSasha Levin 	} else if (strcmp(param, "host_ip") == 0) {
2259a6d73f1SSasha Levin 		p->host_ip = strdup(val);
22669205aa1SAsias He 	} else if (strcmp(param, "trans") == 0) {
22769205aa1SAsias He 		p->trans = strdup(val);
2289ed67cdcSSasha Levin 	} else if (strcmp(param, "vhost") == 0) {
2299ed67cdcSSasha Levin 		p->vhost = atoi(val);
230f19edd1eSSasha Levin 	} else if (strcmp(param, "fd") == 0) {
231f19edd1eSSasha Levin 		p->fd = atoi(val);
23221aa628eSMichael Ellerman 	} else
23321aa628eSMichael Ellerman 		die("Unknown network parameter %s", param);
2349a6d73f1SSasha Levin 
2359a6d73f1SSasha Levin 	return 0;
2369a6d73f1SSasha Levin }
2379a6d73f1SSasha Levin 
2389a6d73f1SSasha Levin static int netdev_parser(const struct option *opt, const char *arg, int unset)
2399a6d73f1SSasha Levin {
2409a6d73f1SSasha Levin 	struct virtio_net_params p;
2419a6d73f1SSasha Levin 	char *buf = NULL, *cmd = NULL, *cur = NULL;
2429a6d73f1SSasha Levin 	bool on_cmd = true;
2439a6d73f1SSasha Levin 
2449a6d73f1SSasha Levin 	if (arg) {
2459a6d73f1SSasha Levin 		buf = strdup(arg);
2469a6d73f1SSasha Levin 		if (buf == NULL)
2479a6d73f1SSasha Levin 			die("Failed allocating new net buffer");
2489a6d73f1SSasha Levin 		cur = strtok(buf, ",=");
2499a6d73f1SSasha Levin 	}
2509a6d73f1SSasha Levin 
2519a6d73f1SSasha Levin 	p = (struct virtio_net_params) {
2529a6d73f1SSasha Levin 		.guest_ip	= DEFAULT_GUEST_ADDR,
2539a6d73f1SSasha Levin 		.host_ip	= DEFAULT_HOST_ADDR,
2549a6d73f1SSasha Levin 		.script		= DEFAULT_SCRIPT,
2559a6d73f1SSasha Levin 		.mode		= NET_MODE_TAP,
2569a6d73f1SSasha Levin 	};
2579a6d73f1SSasha Levin 
2589a6d73f1SSasha Levin 	str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac);
25947621338SSasha Levin 	p.guest_mac[5] += kvm->cfg.num_net_devices;
2609a6d73f1SSasha Levin 
2619a6d73f1SSasha Levin 	while (cur) {
2629a6d73f1SSasha Levin 		if (on_cmd) {
2639a6d73f1SSasha Levin 			cmd = cur;
2649a6d73f1SSasha Levin 		} else {
2659a6d73f1SSasha Levin 			if (set_net_param(&p, cmd, cur) < 0)
2669a6d73f1SSasha Levin 				goto done;
2679a6d73f1SSasha Levin 		}
2689a6d73f1SSasha Levin 		on_cmd = !on_cmd;
2699a6d73f1SSasha Levin 
2709a6d73f1SSasha Levin 		cur = strtok(NULL, ",=");
2719a6d73f1SSasha Levin 	};
2729a6d73f1SSasha Levin 
27347621338SSasha Levin 	kvm->cfg.num_net_devices++;
2749a6d73f1SSasha Levin 
27547621338SSasha Levin 	kvm->cfg.net_params = realloc(kvm->cfg.net_params, kvm->cfg.num_net_devices * sizeof(*kvm->cfg.net_params));
27647621338SSasha Levin 	if (kvm->cfg.net_params == NULL)
2779a6d73f1SSasha Levin 		die("Failed adding new network device");
2789a6d73f1SSasha Levin 
27947621338SSasha Levin 	kvm->cfg.net_params[kvm->cfg.num_net_devices - 1] = p;
2809a6d73f1SSasha Levin 
2819a6d73f1SSasha Levin done:
2829a6d73f1SSasha Levin 	free(buf);
2839a6d73f1SSasha Levin 	return 0;
2849a6d73f1SSasha Levin }
2859a6d73f1SSasha Levin 
28695d13a52SSasha Levin static int shmem_parser(const struct option *opt, const char *arg, int unset)
28795d13a52SSasha Levin {
28872f1ad6dSSasha Levin 	const u64 default_size = SHMEM_DEFAULT_SIZE;
28972f1ad6dSSasha Levin 	const u64 default_phys_addr = SHMEM_DEFAULT_ADDR;
29095d13a52SSasha Levin 	const char *default_handle = SHMEM_DEFAULT_HANDLE;
29195d13a52SSasha Levin 	struct shmem_info *si = malloc(sizeof(struct shmem_info));
29272f1ad6dSSasha Levin 	u64 phys_addr;
29372f1ad6dSSasha Levin 	u64 size;
29495d13a52SSasha Levin 	char *handle = NULL;
29595d13a52SSasha Levin 	int create = 0;
29695d13a52SSasha Levin 	const char *p = arg;
29795d13a52SSasha Levin 	char *next;
29895d13a52SSasha Levin 	int base = 10;
29995d13a52SSasha Levin 	int verbose = 0;
30095d13a52SSasha Levin 
30195d13a52SSasha Levin 	const int skip_pci = strlen("pci:");
30295d13a52SSasha Levin 	if (verbose)
30395d13a52SSasha Levin 		pr_info("shmem_parser(%p,%s,%d)", opt, arg, unset);
30495d13a52SSasha Levin 	/* parse out optional addr family */
30595d13a52SSasha Levin 	if (strcasestr(p, "pci:")) {
30695d13a52SSasha Levin 		p += skip_pci;
30795d13a52SSasha Levin 	} else if (strcasestr(p, "mem:")) {
30895d13a52SSasha Levin 		die("I can't add to E820 map yet.\n");
30995d13a52SSasha Levin 	}
31095d13a52SSasha Levin 	/* parse out physical addr */
31195d13a52SSasha Levin 	base = 10;
31295d13a52SSasha Levin 	if (strcasestr(p, "0x"))
31395d13a52SSasha Levin 		base = 16;
31495d13a52SSasha Levin 	phys_addr = strtoll(p, &next, base);
31595d13a52SSasha Levin 	if (next == p && phys_addr == 0) {
31695d13a52SSasha Levin 		pr_info("shmem: no physical addr specified, using default.");
31795d13a52SSasha Levin 		phys_addr = default_phys_addr;
31895d13a52SSasha Levin 	}
31995d13a52SSasha Levin 	if (*next != ':' && *next != '\0')
32095d13a52SSasha Levin 		die("shmem: unexpected chars after phys addr.\n");
32195d13a52SSasha Levin 	if (*next == '\0')
32295d13a52SSasha Levin 		p = next;
32395d13a52SSasha Levin 	else
32495d13a52SSasha Levin 		p = next + 1;
32595d13a52SSasha Levin 	/* parse out size */
32695d13a52SSasha Levin 	base = 10;
32795d13a52SSasha Levin 	if (strcasestr(p, "0x"))
32895d13a52SSasha Levin 		base = 16;
32995d13a52SSasha Levin 	size = strtoll(p, &next, base);
33095d13a52SSasha Levin 	if (next == p && size == 0) {
33195d13a52SSasha Levin 		pr_info("shmem: no size specified, using default.");
33295d13a52SSasha Levin 		size = default_size;
33395d13a52SSasha Levin 	}
33495d13a52SSasha Levin 	/* look for [KMGkmg][Bb]*  uses base 2. */
33595d13a52SSasha Levin 	int skip_B = 0;
33695d13a52SSasha Levin 	if (strspn(next, "KMGkmg")) {	/* might have a prefix */
33795d13a52SSasha Levin 		if (*(next + 1) == 'B' || *(next + 1) == 'b')
33895d13a52SSasha Levin 			skip_B = 1;
33995d13a52SSasha Levin 		switch (*next) {
34095d13a52SSasha Levin 		case 'K':
34195d13a52SSasha Levin 		case 'k':
34295d13a52SSasha Levin 			size = size << KB_SHIFT;
34395d13a52SSasha Levin 			break;
34495d13a52SSasha Levin 		case 'M':
34595d13a52SSasha Levin 		case 'm':
34695d13a52SSasha Levin 			size = size << MB_SHIFT;
34795d13a52SSasha Levin 			break;
34895d13a52SSasha Levin 		case 'G':
34995d13a52SSasha Levin 		case 'g':
35095d13a52SSasha Levin 			size = size << GB_SHIFT;
35195d13a52SSasha Levin 			break;
35295d13a52SSasha Levin 		default:
35395d13a52SSasha Levin 			die("shmem: bug in detecting size prefix.");
35495d13a52SSasha Levin 			break;
35595d13a52SSasha Levin 		}
35695d13a52SSasha Levin 		next += 1 + skip_B;
35795d13a52SSasha Levin 	}
35895d13a52SSasha Levin 	if (*next != ':' && *next != '\0') {
35995d13a52SSasha Levin 		die("shmem: unexpected chars after phys size. <%c><%c>\n",
36095d13a52SSasha Levin 		    *next, *p);
36195d13a52SSasha Levin 	}
36295d13a52SSasha Levin 	if (*next == '\0')
36395d13a52SSasha Levin 		p = next;
36495d13a52SSasha Levin 	else
36595d13a52SSasha Levin 		p = next + 1;
36695d13a52SSasha Levin 	/* parse out optional shmem handle */
36795d13a52SSasha Levin 	const int skip_handle = strlen("handle=");
36895d13a52SSasha Levin 	next = strcasestr(p, "handle=");
36995d13a52SSasha Levin 	if (*p && next) {
37095d13a52SSasha Levin 		if (p != next)
37195d13a52SSasha Levin 			die("unexpected chars before handle\n");
37295d13a52SSasha Levin 		p += skip_handle;
37395d13a52SSasha Levin 		next = strchrnul(p, ':');
37495d13a52SSasha Levin 		if (next - p) {
37595d13a52SSasha Levin 			handle = malloc(next - p + 1);
37695d13a52SSasha Levin 			strncpy(handle, p, next - p);
37795d13a52SSasha Levin 			handle[next - p] = '\0';	/* just in case. */
37895d13a52SSasha Levin 		}
37995d13a52SSasha Levin 		if (*next == '\0')
38095d13a52SSasha Levin 			p = next;
38195d13a52SSasha Levin 		else
38295d13a52SSasha Levin 			p = next + 1;
38395d13a52SSasha Levin 	}
38495d13a52SSasha Levin 	/* parse optional create flag to see if we should create shm seg. */
38595d13a52SSasha Levin 	if (*p && strcasestr(p, "create")) {
38695d13a52SSasha Levin 		create = 1;
38795d13a52SSasha Levin 		p += strlen("create");
38895d13a52SSasha Levin 	}
38995d13a52SSasha Levin 	if (*p != '\0')
39095d13a52SSasha Levin 		die("shmem: unexpected trailing chars\n");
39195d13a52SSasha Levin 	if (handle == NULL) {
39295d13a52SSasha Levin 		handle = malloc(strlen(default_handle) + 1);
39395d13a52SSasha Levin 		strcpy(handle, default_handle);
39495d13a52SSasha Levin 	}
39595d13a52SSasha Levin 	if (verbose) {
39672f1ad6dSSasha Levin 		pr_info("shmem: phys_addr = %llx", phys_addr);
39772f1ad6dSSasha Levin 		pr_info("shmem: size      = %llx", size);
39895d13a52SSasha Levin 		pr_info("shmem: handle    = %s", handle);
39995d13a52SSasha Levin 		pr_info("shmem: create    = %d", create);
40095d13a52SSasha Levin 	}
40195d13a52SSasha Levin 
40295d13a52SSasha Levin 	si->phys_addr = phys_addr;
40395d13a52SSasha Levin 	si->size = size;
40495d13a52SSasha Levin 	si->handle = handle;
40595d13a52SSasha Levin 	si->create = create;
40695d13a52SSasha Levin 	pci_shmem__register_mem(si);	/* ownership of si, etc. passed on. */
40795d13a52SSasha Levin 	return 0;
40895d13a52SSasha Levin }
409b4422bf3SAneesh Kumar K.V 
/*
 * Define `struct option name[]`, the option table for "run".
 *
 * @name: identifier of the array to define.
 * @cfg:  pointer to the configuration structure whose fields receive the
 *        parsed values. Some options are backed by file-scope variables or
 *        by the *_parser callbacks instead.
 *
 * The expansion already ends with the terminating ';' of the definition.
 *
 * Help strings that do not fit on one line are split into adjacent string
 * literals. Continuing a single literal across a backslash-newline would
 * embed the next line's indentation in the help text.
 */
#define BUILD_OPTIONS(name, cfg)					\
	struct option name[] = {					\
	OPT_GROUP("Basic options:"),					\
	OPT_STRING('\0', "name", &(cfg)->guest_name, "guest name",	\
			"A name for the guest"),			\
	OPT_INTEGER('c', "cpus", &nrcpus, "Number of CPUs"),		\
	OPT_U64('m', "mem", &(cfg)->ram_size,				\
			"Virtual machine memory size in MiB."),		\
	OPT_CALLBACK('\0', "shmem", NULL,				\
		     "[pci:]<addr>:<size>[:handle=<handle>][:create]",	\
		     "Share host shmem with guest via pci device",	\
		     shmem_parser),					\
	OPT_CALLBACK('d', "disk", NULL, "image or rootfs_dir",		\
			"Disk image or rootfs directory",		\
			img_name_parser),				\
	OPT_BOOLEAN('\0', "balloon", &(cfg)->balloon,			\
			"Enable virtio balloon"),			\
	OPT_BOOLEAN('\0', "vnc", &(cfg)->vnc, "Enable VNC framebuffer"),\
	OPT_BOOLEAN('\0', "sdl", &(cfg)->sdl, "Enable SDL framebuffer"),\
	OPT_BOOLEAN('\0', "rng", &(cfg)->virtio_rng,			\
			"Enable virtio Random Number Generator"),	\
	OPT_CALLBACK('\0', "9p", NULL, "dir_to_share,tag_name",		\
		     "Enable virtio 9p to share files between host and"	\
		     " guest", virtio_9p_rootdir_parser),		\
	OPT_STRING('\0', "console", &(cfg)->console,			\
			"serial, virtio or hv", "Console to use"),	\
	OPT_STRING('\0', "dev", &(cfg)->dev, "device_file",		\
			"KVM device file"),				\
	OPT_CALLBACK('\0', "tty", NULL, "tty id",			\
		     "Remap guest TTY into a pty on the host",		\
		     tty_parser),					\
	OPT_STRING('\0', "sandbox", &(cfg)->sandbox, "script",		\
			"Run this script when booting into custom"	\
			" rootfs"),					\
	OPT_STRING('\0', "hugetlbfs", &(cfg)->hugetlbfs_path, "path",	\
			"Hugetlbfs path"),				\
									\
	OPT_GROUP("Kernel options:"),					\
	OPT_STRING('k', "kernel", &(cfg)->kernel_filename, "kernel",	\
			"Kernel to boot in virtual machine"),		\
	OPT_STRING('i', "initrd", &(cfg)->initrd_filename, "initrd",	\
			"Initial RAM disk image"),			\
	OPT_STRING('p', "params", &(cfg)->kernel_cmdline, "params",	\
			"Kernel command line arguments"),		\
	OPT_STRING('f', "firmware", &(cfg)->firmware_filename, "firmware",\
			"Firmware image to boot in virtual machine"),	\
									\
	OPT_GROUP("Networking options:"),				\
	OPT_CALLBACK_DEFAULT('n', "network", NULL, "network params",	\
		     "Create a new guest NIC",				\
		     netdev_parser, NULL),				\
	OPT_BOOLEAN('\0', "no-dhcp", &(cfg)->no_dhcp,			\
			"Disable kernel DHCP in rootfs mode"),		\
									\
	OPT_GROUP("BIOS options:"),					\
	OPT_INTEGER('\0', "vidmode", &vidmode,				\
		    "Video mode"),					\
									\
	OPT_GROUP("Debug options:"),					\
	OPT_BOOLEAN('\0', "debug", &do_debug_print,			\
			"Enable debug messages"),			\
	OPT_BOOLEAN('\0', "debug-single-step", &(cfg)->single_step,	\
			"Enable single stepping"),			\
	OPT_BOOLEAN('\0', "debug-ioport", &(cfg)->ioport_debug,		\
			"Enable ioport debugging"),			\
	OPT_BOOLEAN('\0', "debug-mmio", &(cfg)->mmio_debug,		\
			"Enable MMIO debugging"),			\
	OPT_INTEGER('\0', "debug-iodelay", &debug_iodelay,		\
			"Delay IO by millisecond"),			\
	OPT_END()							\
	};
480f967c427SPrasad Joshi 
481b5b501ccSIngo Molnar /*
482b5b501ccSIngo Molnar  * Serialize debug printout so that the output of multiple vcpus does not
483b5b501ccSIngo Molnar  * get mixed up:
484b5b501ccSIngo Molnar  */
485cffeab25SIngo Molnar static int printout_done;
486b5b501ccSIngo Molnar 
48743119af7SPekka Enberg static void handle_sigusr1(int sig)
48843119af7SPekka Enberg {
48943119af7SPekka Enberg 	struct kvm_cpu *cpu = current_kvm_cpu;
490b7d2f013SSasha Levin 	int fd = kvm_cpu__get_debug_fd();
49143119af7SPekka Enberg 
4924b1c6f6eSSasha Levin 	if (!cpu || cpu->needs_nmi)
49343119af7SPekka Enberg 		return;
49443119af7SPekka Enberg 
495b7d2f013SSasha Levin 	dprintf(fd, "\n #\n # vCPU #%ld's dump:\n #\n", cpu->cpu_id);
49643119af7SPekka Enberg 	kvm_cpu__show_registers(cpu);
49743119af7SPekka Enberg 	kvm_cpu__show_code(cpu);
49843119af7SPekka Enberg 	kvm_cpu__show_page_tables(cpu);
499b5b501ccSIngo Molnar 	fflush(stdout);
500cffeab25SIngo Molnar 	printout_done = 1;
501cffeab25SIngo Molnar 	mb();
50243119af7SPekka Enberg }
50343119af7SPekka Enberg 
504d94e22b9SSasha Levin /* Pause/resume the guest using SIGUSR2 */
505d94e22b9SSasha Levin static int is_paused;
506d94e22b9SSasha Levin 
5074b1addaeSSasha Levin static void handle_pause(int fd, u32 type, u32 len, u8 *msg)
508d94e22b9SSasha Levin {
5095aa502e4SLai Jiangshan 	if (WARN_ON(len))
5105aa502e4SLai Jiangshan 		return;
5115aa502e4SLai Jiangshan 
5127021c50bSAsias He 	if (type == KVM_IPC_RESUME && is_paused) {
5137021c50bSAsias He 		kvm->vm_state = KVM_VMSTATE_RUNNING;
514d94e22b9SSasha Levin 		kvm__continue();
5157021c50bSAsias He 	} else if (type == KVM_IPC_PAUSE && !is_paused) {
5167021c50bSAsias He 		kvm->vm_state = KVM_VMSTATE_PAUSED;
517eb8dad9dSSasha Levin 		ioctl(kvm->vm_fd, KVM_KVMCLOCK_CTRL);
518d94e22b9SSasha Levin 		kvm__pause();
5197021c50bSAsias He 	} else {
52002317b74SSasha Levin 		return;
5215aa502e4SLai Jiangshan 	}
522d94e22b9SSasha Levin 
523d94e22b9SSasha Levin 	is_paused = !is_paused;
524d94e22b9SSasha Levin }
525d94e22b9SSasha Levin 
5267021c50bSAsias He static void handle_vmstate(int fd, u32 type, u32 len, u8 *msg)
5277021c50bSAsias He {
5287021c50bSAsias He 	int r = 0;
5297021c50bSAsias He 
5307021c50bSAsias He 	if (type == KVM_IPC_VMSTATE)
5317021c50bSAsias He 		r = write(fd, &kvm->vm_state, sizeof(kvm->vm_state));
5327021c50bSAsias He 
5337021c50bSAsias He 	if (r < 0)
5347021c50bSAsias He 		pr_warning("Failed sending VMSTATE");
5357021c50bSAsias He }
5367021c50bSAsias He 
5374b1addaeSSasha Levin static void handle_debug(int fd, u32 type, u32 len, u8 *msg)
5389e854d1aSPekka Enberg {
5399e854d1aSPekka Enberg 	int i;
540a59cdf44SLai Jiangshan 	struct debug_cmd_params *params;
541a59cdf44SLai Jiangshan 	u32 dbg_type;
542a59cdf44SLai Jiangshan 	u32 vcpu;
543a59cdf44SLai Jiangshan 
544a59cdf44SLai Jiangshan 	if (WARN_ON(type != KVM_IPC_DEBUG || len != sizeof(*params)))
545a59cdf44SLai Jiangshan 		return;
546a59cdf44SLai Jiangshan 
547a59cdf44SLai Jiangshan 	params = (void *)msg;
548a59cdf44SLai Jiangshan 	dbg_type = params->dbg_type;
549a59cdf44SLai Jiangshan 	vcpu = params->cpu;
5504b1c6f6eSSasha Levin 
551226e727bSSasha Levin 	if (dbg_type & KVM_DEBUG_CMD_TYPE_SYSRQ)
552226e727bSSasha Levin 		serial8250__inject_sysrq(kvm, params->sysrq);
553226e727bSSasha Levin 
5544b1c6f6eSSasha Levin 	if (dbg_type & KVM_DEBUG_CMD_TYPE_NMI) {
5557070414aSSasha Levin 		if ((int)vcpu >= kvm->nrcpus)
5564b1c6f6eSSasha Levin 			return;
5574b1c6f6eSSasha Levin 
5584b1c6f6eSSasha Levin 		kvm_cpus[vcpu]->needs_nmi = 1;
5594b1c6f6eSSasha Levin 		pthread_kill(kvm_cpus[vcpu]->thread, SIGUSR1);
5604b1c6f6eSSasha Levin 	}
5614b1c6f6eSSasha Levin 
5624b1c6f6eSSasha Levin 	if (!(dbg_type & KVM_DEBUG_CMD_TYPE_DUMP))
5634b1c6f6eSSasha Levin 		return;
5649e854d1aSPekka Enberg 
5659e854d1aSPekka Enberg 	for (i = 0; i < nrcpus; i++) {
5669e854d1aSPekka Enberg 		struct kvm_cpu *cpu = kvm_cpus[i];
5679e854d1aSPekka Enberg 
56843119af7SPekka Enberg 		if (!cpu)
56943119af7SPekka Enberg 			continue;
57043119af7SPekka Enberg 
571cffeab25SIngo Molnar 		printout_done = 0;
572b7d2f013SSasha Levin 
573b7d2f013SSasha Levin 		kvm_cpu__set_debug_fd(fd);
57443119af7SPekka Enberg 		pthread_kill(cpu->thread, SIGUSR1);
575cffeab25SIngo Molnar 		/*
576cffeab25SIngo Molnar 		 * Wait for the vCPU to dump state before signalling
577cffeab25SIngo Molnar 		 * the next thread. Since this is debug code it does
578cffeab25SIngo Molnar 		 * not matter that we are burning CPU time a bit:
579cffeab25SIngo Molnar 		 */
580cffeab25SIngo Molnar 		while (!printout_done)
581cffeab25SIngo Molnar 			mb();
5829e854d1aSPekka Enberg 	}
5839e854d1aSPekka Enberg 
584b7d2f013SSasha Levin 	close(fd);
585b7d2f013SSasha Levin 
586226e727bSSasha Levin 	serial8250__inject_sysrq(kvm, 'p');
5879e854d1aSPekka Enberg }
5889e854d1aSPekka Enberg 
5899e854d1aSPekka Enberg static void handle_sigalrm(int sig)
5909e854d1aSPekka Enberg {
5910b69bdefSMatt Evans 	kvm__arch_periodic_poll(kvm);
5929e854d1aSPekka Enberg }
5939e854d1aSPekka Enberg 
5944b1addaeSSasha Levin static void handle_stop(int fd, u32 type, u32 len, u8 *msg)
595daf4cb5aSSasha Levin {
596e333e41aSLai Jiangshan 	if (WARN_ON(type != KVM_IPC_STOP || len))
597e333e41aSLai Jiangshan 		return;
598e333e41aSLai Jiangshan 
599daf4cb5aSSasha Levin 	kvm_cpu__reboot();
600daf4cb5aSSasha Levin }
601daf4cb5aSSasha Levin 
6025ee154d1SPekka Enberg static void *kvm_cpu_thread(void *arg)
6035ee154d1SPekka Enberg {
604d77a9efaSCyrill Gorcunov 	current_kvm_cpu		= arg;
6055ee154d1SPekka Enberg 
606d77a9efaSCyrill Gorcunov 	if (kvm_cpu__start(current_kvm_cpu))
6075ee154d1SPekka Enberg 		goto panic_kvm;
6085ee154d1SPekka Enberg 
6095ee154d1SPekka Enberg 	return (void *) (intptr_t) 0;
6105ee154d1SPekka Enberg 
6115ee154d1SPekka Enberg panic_kvm:
6123fdf659dSSasha Levin 	fprintf(stderr, "KVM exit reason: %u (\"%s\")\n",
613d77a9efaSCyrill Gorcunov 		current_kvm_cpu->kvm_run->exit_reason,
614d77a9efaSCyrill Gorcunov 		kvm_exit_reasons[current_kvm_cpu->kvm_run->exit_reason]);
615d77a9efaSCyrill Gorcunov 	if (current_kvm_cpu->kvm_run->exit_reason == KVM_EXIT_UNKNOWN)
6165ee154d1SPekka Enberg 		fprintf(stderr, "KVM exit code: 0x%Lu\n",
617d77a9efaSCyrill Gorcunov 			current_kvm_cpu->kvm_run->hw.hardware_exit_reason);
6188e5accedSPekka Enberg 
619b7d2f013SSasha Levin 	kvm_cpu__set_debug_fd(STDOUT_FILENO);
620d77a9efaSCyrill Gorcunov 	kvm_cpu__show_registers(current_kvm_cpu);
621d77a9efaSCyrill Gorcunov 	kvm_cpu__show_code(current_kvm_cpu);
622d77a9efaSCyrill Gorcunov 	kvm_cpu__show_page_tables(current_kvm_cpu);
6235ee154d1SPekka Enberg 
6245ee154d1SPekka Enberg 	return (void *) (intptr_t) 1;
6255ee154d1SPekka Enberg }
6265ee154d1SPekka Enberg 
627e08c0896SPrasad Joshi static char kernel[PATH_MAX];
628b0b42ba0SPekka Enberg 
629b0b42ba0SPekka Enberg static const char *host_kernels[] = {
630e08c0896SPrasad Joshi 	"/boot/vmlinuz",
631e08c0896SPrasad Joshi 	"/boot/bzImage",
632e08c0896SPrasad Joshi 	NULL
633e08c0896SPrasad Joshi };
634b0b42ba0SPekka Enberg 
635b0b42ba0SPekka Enberg static const char *default_kernels[] = {
636e08c0896SPrasad Joshi 	"./bzImage",
637b03af790SKonstantin Khlebnikov 	"arch/" BUILD_ARCH "/boot/bzImage",
638af7b0868SMatt Evans 	"../../arch/" BUILD_ARCH "/boot/bzImage",
639e08c0896SPrasad Joshi 	NULL
640e08c0896SPrasad Joshi };
6418329f30bSPekka Enberg 
642b0b42ba0SPekka Enberg static const char *default_vmlinux[] = {
643b03af790SKonstantin Khlebnikov 	"vmlinux",
644b0b42ba0SPekka Enberg 	"../../../vmlinux",
645b0b42ba0SPekka Enberg 	"../../vmlinux",
646b0b42ba0SPekka Enberg 	NULL
647b0b42ba0SPekka Enberg };
648b0b42ba0SPekka Enberg 
649e08c0896SPrasad Joshi static void kernel_usage_with_options(void)
6508329f30bSPekka Enberg {
651e08c0896SPrasad Joshi 	const char **k;
6528329f30bSPekka Enberg 	struct utsname uts;
653e08c0896SPrasad Joshi 
654e08c0896SPrasad Joshi 	fprintf(stderr, "Fatal: could not find default kernel image in:\n");
65565182f37SPrasad Joshi 	k = &default_kernels[0];
656e08c0896SPrasad Joshi 	while (*k) {
657e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", *k);
658e08c0896SPrasad Joshi 		k++;
659e08c0896SPrasad Joshi 	}
660e08c0896SPrasad Joshi 
661e08c0896SPrasad Joshi 	if (uname(&uts) < 0)
662e08c0896SPrasad Joshi 		return;
663e08c0896SPrasad Joshi 
664e08c0896SPrasad Joshi 	k = &host_kernels[0];
665e08c0896SPrasad Joshi 	while (*k) {
666e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
667e08c0896SPrasad Joshi 			return;
668e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", kernel);
669e08c0896SPrasad Joshi 		k++;
670e08c0896SPrasad Joshi 	}
671ee8b1456SWanlong Gao 	fprintf(stderr, "\nPlease see '%s run --help' for more options.\n\n",
672ee8b1456SWanlong Gao 		KVM_BINARY_NAME);
673e08c0896SPrasad Joshi }
674e08c0896SPrasad Joshi 
67560ded003SPekka Enberg static u64 host_ram_size(void)
67660ded003SPekka Enberg {
67760ded003SPekka Enberg 	long page_size;
67860ded003SPekka Enberg 	long nr_pages;
67960ded003SPekka Enberg 
68060ded003SPekka Enberg 	nr_pages	= sysconf(_SC_PHYS_PAGES);
681d63c5ce6SPekka Enberg 	if (nr_pages < 0) {
6824542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PHYS_PAGES) failed");
683d63c5ce6SPekka Enberg 		return 0;
684d63c5ce6SPekka Enberg 	}
68560ded003SPekka Enberg 
68660ded003SPekka Enberg 	page_size	= sysconf(_SC_PAGE_SIZE);
687d63c5ce6SPekka Enberg 	if (page_size < 0) {
6884542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PAGE_SIZE) failed");
689d63c5ce6SPekka Enberg 		return 0;
690d63c5ce6SPekka Enberg 	}
69160ded003SPekka Enberg 
69260ded003SPekka Enberg 	return (nr_pages * page_size) >> MB_SHIFT;
69360ded003SPekka Enberg }
69460ded003SPekka Enberg 
69518bd8c3bSPekka Enberg /*
69618bd8c3bSPekka Enberg  * If user didn't specify how much memory it wants to allocate for the guest,
69718bd8c3bSPekka Enberg  * avoid filling the whole host RAM.
69818bd8c3bSPekka Enberg  */
69918bd8c3bSPekka Enberg #define RAM_SIZE_RATIO		0.8
70018bd8c3bSPekka Enberg 
701fd834defSPekka Enberg static u64 get_ram_size(int nr_cpus)
702fd834defSPekka Enberg {
70306761c76SPekka Enberg 	u64 available;
70406761c76SPekka Enberg 	u64 ram_size;
705fd834defSPekka Enberg 
706fd834defSPekka Enberg 	ram_size	= 64 * (nr_cpus + 3);
707fd834defSPekka Enberg 
70860ded003SPekka Enberg 	available	= host_ram_size() * RAM_SIZE_RATIO;
709d63c5ce6SPekka Enberg 	if (!available)
710d63c5ce6SPekka Enberg 		available = MIN_RAM_SIZE_MB;
711fd834defSPekka Enberg 
712fd834defSPekka Enberg 	if (ram_size > available)
713fd834defSPekka Enberg 		ram_size	= available;
714fd834defSPekka Enberg 
715fd834defSPekka Enberg 	return ram_size;
716fd834defSPekka Enberg }
717fd834defSPekka Enberg 
718e08c0896SPrasad Joshi static const char *find_kernel(void)
719e08c0896SPrasad Joshi {
720e08c0896SPrasad Joshi 	const char **k;
7218329f30bSPekka Enberg 	struct stat st;
722e08c0896SPrasad Joshi 	struct utsname uts;
723e08c0896SPrasad Joshi 
72465182f37SPrasad Joshi 	k = &default_kernels[0];
725e08c0896SPrasad Joshi 	while (*k) {
726e08c0896SPrasad Joshi 		if (stat(*k, &st) < 0 || !S_ISREG(st.st_mode)) {
727e08c0896SPrasad Joshi 			k++;
728e08c0896SPrasad Joshi 			continue;
729e08c0896SPrasad Joshi 		}
730e08c0896SPrasad Joshi 		strncpy(kernel, *k, PATH_MAX);
731e08c0896SPrasad Joshi 		return kernel;
732e08c0896SPrasad Joshi 	}
7338329f30bSPekka Enberg 
7348329f30bSPekka Enberg 	if (uname(&uts) < 0)
7358329f30bSPekka Enberg 		return NULL;
7368329f30bSPekka Enberg 
737e08c0896SPrasad Joshi 	k = &host_kernels[0];
738e08c0896SPrasad Joshi 	while (*k) {
739e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
7408329f30bSPekka Enberg 			return NULL;
7418329f30bSPekka Enberg 
742e08c0896SPrasad Joshi 		if (stat(kernel, &st) < 0 || !S_ISREG(st.st_mode)) {
743e08c0896SPrasad Joshi 			k++;
744e08c0896SPrasad Joshi 			continue;
745e08c0896SPrasad Joshi 		}
746e08c0896SPrasad Joshi 		return kernel;
7478329f30bSPekka Enberg 
748e08c0896SPrasad Joshi 	}
7498329f30bSPekka Enberg 	return NULL;
7508329f30bSPekka Enberg }
7518329f30bSPekka Enberg 
752b0b42ba0SPekka Enberg static const char *find_vmlinux(void)
753b0b42ba0SPekka Enberg {
754b0b42ba0SPekka Enberg 	const char **vmlinux;
755b0b42ba0SPekka Enberg 
756b0b42ba0SPekka Enberg 	vmlinux = &default_vmlinux[0];
757b0b42ba0SPekka Enberg 	while (*vmlinux) {
758b0b42ba0SPekka Enberg 		struct stat st;
759b0b42ba0SPekka Enberg 
760b0b42ba0SPekka Enberg 		if (stat(*vmlinux, &st) < 0 || !S_ISREG(st.st_mode)) {
761b0b42ba0SPekka Enberg 			vmlinux++;
762b0b42ba0SPekka Enberg 			continue;
763b0b42ba0SPekka Enberg 		}
764b0b42ba0SPekka Enberg 		return *vmlinux;
765b0b42ba0SPekka Enberg 	}
766b0b42ba0SPekka Enberg 	return NULL;
767b0b42ba0SPekka Enberg }
768b0b42ba0SPekka Enberg 
769f6677a1dSAmerigo Wang void kvm_run_help(void)
770f6677a1dSAmerigo Wang {
77147621338SSasha Levin 	BUILD_OPTIONS(options, &kvm->cfg);
772f6677a1dSAmerigo Wang 	usage_with_options(run_usage, options);
773f6677a1dSAmerigo Wang }
774f6677a1dSAmerigo Wang 
775afc2c7c0SAsias He static int kvm_setup_guest_init(void)
7769cec19c8SSasha Levin {
77747621338SSasha Levin 	const char *rootfs = kvm->cfg.custom_rootfs_name;
778afc2c7c0SAsias He 	char tmp[PATH_MAX];
779afc2c7c0SAsias He 	size_t size;
780afc2c7c0SAsias He 	int fd, ret;
781afc2c7c0SAsias He 	char *data;
7829cec19c8SSasha Levin 
783afc2c7c0SAsias He 	/* Setup /virt/init */
784afc2c7c0SAsias He 	size = (size_t)&_binary_guest_init_size;
785afc2c7c0SAsias He 	data = (char *)&_binary_guest_init_start;
786afc2c7c0SAsias He 	snprintf(tmp, PATH_MAX, "%s%s/virt/init", kvm__get_dir(), rootfs);
787afc2c7c0SAsias He 	remove(tmp);
788afc2c7c0SAsias He 	fd = open(tmp, O_CREAT | O_WRONLY, 0755);
789afc2c7c0SAsias He 	if (fd < 0)
790afc2c7c0SAsias He 		die("Fail to setup %s", tmp);
791afc2c7c0SAsias He 	ret = xwrite(fd, data, size);
792afc2c7c0SAsias He 	if (ret < 0)
793afc2c7c0SAsias He 		die("Fail to setup %s", tmp);
794afc2c7c0SAsias He 	close(fd);
7959cec19c8SSasha Levin 
796afc2c7c0SAsias He 	return 0;
7979cec19c8SSasha Levin }
7989cec19c8SSasha Levin 
799d50fe489SSasha Levin static int kvm_run_set_sandbox(void)
800d50fe489SSasha Levin {
80147621338SSasha Levin 	const char *guestfs_name = kvm->cfg.custom_rootfs_name;
802d50fe489SSasha Levin 	char path[PATH_MAX], script[PATH_MAX], *tmp;
803d50fe489SSasha Levin 
804d50fe489SSasha Levin 	snprintf(path, PATH_MAX, "%s%s/virt/sandbox.sh", kvm__get_dir(), guestfs_name);
805d50fe489SSasha Levin 
806d50fe489SSasha Levin 	remove(path);
807d50fe489SSasha Levin 
80847621338SSasha Levin 	if (kvm->cfg.sandbox == NULL)
809d50fe489SSasha Levin 		return 0;
810d50fe489SSasha Levin 
81147621338SSasha Levin 	tmp = realpath(kvm->cfg.sandbox, NULL);
812d50fe489SSasha Levin 	if (tmp == NULL)
813d50fe489SSasha Levin 		return -ENOMEM;
814d50fe489SSasha Levin 
815d50fe489SSasha Levin 	snprintf(script, PATH_MAX, "/host/%s", tmp);
816d50fe489SSasha Levin 	free(tmp);
817d50fe489SSasha Levin 
818d50fe489SSasha Levin 	return symlink(script, path);
819d50fe489SSasha Levin }
820d50fe489SSasha Levin 
/* Write len bytes of buf to the sandbox script; any failure is fatal. */
static void sandbox_script_emit(int fd, const char *buf, size_t len)
{
	if (write(fd, buf, len) <= 0)
		die("Failed writing sandbox script");
}

/*
 * Write one argument to the sandbox script, quoted so that the shell sees
 * it exactly as given.
 *
 * Runs of characters without a single quote are wrapped as 'run'; each
 * single quote is written as "'". An empty argument becomes ''.
 */
static void kvm_write_sandbox_cmd_exactly(int fd, const char *arg)
{
	const char *quote;

	if (*arg == '\0') {
		sandbox_script_emit(fd, "''", 2);
		return;
	}

	do {
		/* Points at the next single quote, or at the terminating NUL */
		quote = strchrnul(arg, '\'');

		if (quote != arg) {
			sandbox_script_emit(fd, "'", 1);
			sandbox_script_emit(fd, arg, quote - arg);
			sandbox_script_emit(fd, "'", 1);
		}

		if (*quote == '\0')
			return;

		sandbox_script_emit(fd, "\"'\"", 3);
		arg = quote + 1;
	} while (*arg != '\0');
}
8525173b4afSLai Jiangshan 
8535cd19aa0SPekka Enberg static void resolve_program(const char *src, char *dst, size_t len)
8545cd19aa0SPekka Enberg {
8555cd19aa0SPekka Enberg 	struct stat st;
856c2c742d9SPekka Enberg 	int err;
8575cd19aa0SPekka Enberg 
858c2c742d9SPekka Enberg 	err = stat(src, &st);
8595cd19aa0SPekka Enberg 
860c2c742d9SPekka Enberg 	if (!err && S_ISREG(st.st_mode)) {
8615cd19aa0SPekka Enberg 		char resolved_path[PATH_MAX];
8625cd19aa0SPekka Enberg 
863de3f75c9SPekka Enberg 		if (!realpath(src, resolved_path))
864de3f75c9SPekka Enberg 			die("Unable to resolve program %s: %s\n", src, strerror(errno));
8655cd19aa0SPekka Enberg 
8665cd19aa0SPekka Enberg 		snprintf(dst, len, "/host%s", resolved_path);
8675cd19aa0SPekka Enberg 	} else
8685cd19aa0SPekka Enberg 		strncpy(dst, src, len);
8695cd19aa0SPekka Enberg }
8705cd19aa0SPekka Enberg 
8713c29e2aaSSasha Levin static void kvm_run_write_sandbox_cmd(const char **argv, int argc)
8723c29e2aaSSasha Levin {
8733c29e2aaSSasha Levin 	const char script_hdr[] = "#! /bin/bash\n\n";
8745cd19aa0SPekka Enberg 	char program[PATH_MAX];
8753c29e2aaSSasha Levin 	int fd;
8763c29e2aaSSasha Levin 
87747621338SSasha Levin 	remove(kvm->cfg.sandbox);
8783c29e2aaSSasha Levin 
87947621338SSasha Levin 	fd = open(kvm->cfg.sandbox, O_RDWR | O_CREAT, 0777);
8803c29e2aaSSasha Levin 	if (fd < 0)
8813c29e2aaSSasha Levin 		die("Failed creating sandbox script");
8823c29e2aaSSasha Levin 
8833c29e2aaSSasha Levin 	if (write(fd, script_hdr, sizeof(script_hdr) - 1) <= 0)
8843c29e2aaSSasha Levin 		die("Failed writing sandbox script");
8853c29e2aaSSasha Levin 
8865cd19aa0SPekka Enberg 	resolve_program(argv[0], program, PATH_MAX);
8875cd19aa0SPekka Enberg 	kvm_write_sandbox_cmd_exactly(fd, program);
8885cd19aa0SPekka Enberg 
8895cd19aa0SPekka Enberg 	argv++;
8905cd19aa0SPekka Enberg 	argc--;
8915cd19aa0SPekka Enberg 
8923c29e2aaSSasha Levin 	while (argc) {
8933c29e2aaSSasha Levin 		if (write(fd, " ", 1) <= 0)
8943c29e2aaSSasha Levin 			die("Failed writing sandbox script");
8955cd19aa0SPekka Enberg 
8965cd19aa0SPekka Enberg 		kvm_write_sandbox_cmd_exactly(fd, argv[0]);
8973c29e2aaSSasha Levin 		argv++;
8983c29e2aaSSasha Levin 		argc--;
8993c29e2aaSSasha Levin 	}
9003c29e2aaSSasha Levin 	if (write(fd, "\n", 1) <= 0)
9013c29e2aaSSasha Levin 		die("Failed writing sandbox script");
9023c29e2aaSSasha Levin 
9033c29e2aaSSasha Levin 	close(fd);
9043c29e2aaSSasha Levin }
9053c29e2aaSSasha Levin 
906e1e46fe6SSasha Levin static int kvm_cmd_run_init(int argc, const char **argv)
907f967c427SPrasad Joshi {
9082d96f6b6SSasha Levin 	static char real_cmdline[2048], default_name[20];
909aba1efa5SPekka Enberg 	struct framebuffer *fb = NULL;
910384922b3SPekka Enberg 	unsigned int nr_online_cpus;
9118259b8ccSSasha Levin 	int max_cpus, recommended_cpus;
9124932d174SSasha Levin 	int i, r;
91347621338SSasha Levin 
91447621338SSasha Levin 	kvm = kvm__new();
91547621338SSasha Levin 	if (IS_ERR(kvm))
91647621338SSasha Levin 		return PTR_ERR(kvm);
917f967c427SPrasad Joshi 
9185ee154d1SPekka Enberg 	signal(SIGALRM, handle_sigalrm);
9194b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_DEBUG, handle_debug);
92043119af7SPekka Enberg 	signal(SIGUSR1, handle_sigusr1);
9214b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_PAUSE, handle_pause);
9224b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_RESUME, handle_pause);
9234b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_STOP, handle_stop);
9247021c50bSAsias He 	kvm_ipc__register_handler(KVM_IPC_VMSTATE, handle_vmstate);
925f967c427SPrasad Joshi 
926cfd63bbbSSasha Levin 	nr_online_cpus = sysconf(_SC_NPROCESSORS_ONLN);
92747621338SSasha Levin 	kvm->cfg.custom_rootfs_name = "default";
928cfd63bbbSSasha Levin 
929f967c427SPrasad Joshi 	while (argc != 0) {
93047621338SSasha Levin 		BUILD_OPTIONS(options, &kvm->cfg);
931f967c427SPrasad Joshi 		argc = parse_options(argc, argv, options, run_usage,
9321a007c82SSasha Levin 				PARSE_OPT_STOP_AT_NON_OPTION |
9331a007c82SSasha Levin 				PARSE_OPT_KEEP_DASHDASH);
934f967c427SPrasad Joshi 		if (argc != 0) {
9351a007c82SSasha Levin 			/* Cusrom options, should have been handled elsewhere */
9363c29e2aaSSasha Levin 			if (strcmp(argv[0], "--") == 0) {
9373c29e2aaSSasha Levin 				if (kvm_run_wrapper == KVM_RUN_SANDBOX) {
93847621338SSasha Levin 					kvm->cfg.sandbox = DEFAULT_SANDBOX_FILENAME;
9393c29e2aaSSasha Levin 					kvm_run_write_sandbox_cmd(argv+1, argc-1);
9401a007c82SSasha Levin 					break;
9413c29e2aaSSasha Levin 				}
9423c29e2aaSSasha Levin 			}
9431a007c82SSasha Levin 
94447621338SSasha Levin 			if ((kvm_run_wrapper == KVM_RUN_DEFAULT && kvm->cfg.kernel_filename) ||
94547621338SSasha Levin 				(kvm_run_wrapper == KVM_RUN_SANDBOX && kvm->cfg.sandbox)) {
946f967c427SPrasad Joshi 				fprintf(stderr, "Cannot handle parameter: "
947f967c427SPrasad Joshi 						"%s\n", argv[0]);
948f967c427SPrasad Joshi 				usage_with_options(run_usage, options);
94947621338SSasha Levin 				free(kvm);
950e120b624SPaul Neumann 				return -EINVAL;
951f967c427SPrasad Joshi 			}
952e0747665SSasha Levin 			if (kvm_run_wrapper == KVM_RUN_SANDBOX) {
953e0747665SSasha Levin 				/*
954e0747665SSasha Levin 				 * first unhandled parameter is treated as
955e0747665SSasha Levin 				 * sandbox command
956e0747665SSasha Levin 				 */
95747621338SSasha Levin 				kvm->cfg.sandbox = DEFAULT_SANDBOX_FILENAME;
958e0747665SSasha Levin 				kvm_run_write_sandbox_cmd(argv, argc);
959e0747665SSasha Levin 			} else {
960e0747665SSasha Levin 				/*
961e0747665SSasha Levin 				 * first unhandled parameter is treated as a kernel
962e0747665SSasha Levin 				 * image
963f967c427SPrasad Joshi 				 */
96447621338SSasha Levin 				kvm->cfg.kernel_filename = argv[0];
965e0747665SSasha Levin 			}
966f967c427SPrasad Joshi 			argv++;
967f967c427SPrasad Joshi 			argc--;
968f967c427SPrasad Joshi 		}
969f967c427SPrasad Joshi 
970f967c427SPrasad Joshi 	}
971f967c427SPrasad Joshi 
97247621338SSasha Levin 	if (!kvm->cfg.kernel_filename)
97347621338SSasha Levin 		kvm->cfg.kernel_filename = find_kernel();
9748329f30bSPekka Enberg 
97547621338SSasha Levin 	if (!kvm->cfg.kernel_filename) {
976e08c0896SPrasad Joshi 		kernel_usage_with_options();
977e120b624SPaul Neumann 		return -EINVAL;
9788329f30bSPekka Enberg 	}
9798329f30bSPekka Enberg 
98047621338SSasha Levin 	kvm->cfg.vmlinux_filename = find_vmlinux();
981b0b42ba0SPekka Enberg 
982cfd63bbbSSasha Levin 	if (nrcpus == 0)
983cfd63bbbSSasha Levin 		nrcpus = nr_online_cpus;
984d77a9efaSCyrill Gorcunov 
98547621338SSasha Levin 	if (!kvm->cfg.ram_size)
98647621338SSasha Levin 		kvm->cfg.ram_size = get_ram_size(nrcpus);
987fd834defSPekka Enberg 
98847621338SSasha Levin 	if (kvm->cfg.ram_size < MIN_RAM_SIZE_MB)
98947621338SSasha Levin 		die("Not enough memory specified: %lluMB (min %lluMB)", kvm->cfg.ram_size, MIN_RAM_SIZE_MB);
990a2a002f9SIngo Molnar 
99147621338SSasha Levin 	if (kvm->cfg.ram_size > host_ram_size())
99247621338SSasha Levin 		pr_warning("Guest memory size %lluMB exceeds host physical RAM size %lluMB", kvm->cfg.ram_size, host_ram_size());
99360ded003SPekka Enberg 
99447621338SSasha Levin 	kvm->cfg.ram_size <<= MB_SHIFT;
995f967c427SPrasad Joshi 
99647621338SSasha Levin 	if (!kvm->cfg.dev)
99747621338SSasha Levin 		kvm->cfg.dev = DEFAULT_KVM_DEV;
998f967c427SPrasad Joshi 
99947621338SSasha Levin 	if (!kvm->cfg.console)
100047621338SSasha Levin 		kvm->cfg.console = DEFAULT_CONSOLE;
10019aa4a0ebSAsias He 
100247621338SSasha Levin 	if (!strncmp(kvm->cfg.console, "virtio", 6))
1003f967c427SPrasad Joshi 		active_console  = CONSOLE_VIRTIO;
100447621338SSasha Levin 	else if (!strncmp(kvm->cfg.console, "serial", 6))
10059aa4a0ebSAsias He 		active_console  = CONSOLE_8250;
100647621338SSasha Levin 	else if (!strncmp(kvm->cfg.console, "hv", 2))
10073bbc49b6SMatt Evans 		active_console = CONSOLE_HV;
10083bbc49b6SMatt Evans 	else
10093bbc49b6SMatt Evans 		pr_warning("No console!");
1010f967c427SPrasad Joshi 
101147621338SSasha Levin 	if (!kvm->cfg.host_ip)
101247621338SSasha Levin 		kvm->cfg.host_ip = DEFAULT_HOST_ADDR;
10134d67c820SSasha Levin 
101447621338SSasha Levin 	if (!kvm->cfg.guest_ip)
101547621338SSasha Levin 		kvm->cfg.guest_ip = DEFAULT_GUEST_ADDR;
1016bb8ffd2fSAsias He 
101747621338SSasha Levin 	if (!kvm->cfg.guest_mac)
101847621338SSasha Levin 		kvm->cfg.guest_mac = DEFAULT_GUEST_MAC;
1019a4e724ddSSasha Levin 
102047621338SSasha Levin 	if (!kvm->cfg.host_mac)
102147621338SSasha Levin 		kvm->cfg.host_mac = DEFAULT_HOST_MAC;
1022d7098b9bSAsias He 
102347621338SSasha Levin 	if (!kvm->cfg.script)
102447621338SSasha Levin 		kvm->cfg.script = DEFAULT_SCRIPT;
102573b7d038SAmos Kong 
1026f967c427SPrasad Joshi 	term_init();
1027f967c427SPrasad Joshi 
102847621338SSasha Levin 	if (!kvm->cfg.guest_name) {
102947621338SSasha Levin 		if (kvm->cfg.custom_rootfs) {
103047621338SSasha Levin 			kvm->cfg.guest_name = kvm->cfg.custom_rootfs_name;
1031587a4d17SLai Jiangshan 		} else {
10322d96f6b6SSasha Levin 			sprintf(default_name, "guest-%u", getpid());
103347621338SSasha Levin 			kvm->cfg.guest_name = default_name;
10342d96f6b6SSasha Levin 		}
1035587a4d17SLai Jiangshan 	}
10362d96f6b6SSasha Levin 
103747621338SSasha Levin 	r = kvm__init(kvm);
103847621338SSasha Levin 	if (r)
1039d648dbf5SCyrill Gorcunov 		goto fail;
1040f967c427SPrasad Joshi 
1041ea6eeb1cSSasha Levin 	r = ioeventfd__init(kvm);
1042ea6eeb1cSSasha Levin 	if (r < 0) {
1043ea6eeb1cSSasha Levin 		pr_err("ioeventfd__init() failed with error %d\n", r);
1044ea6eeb1cSSasha Levin 		goto fail;
1045ea6eeb1cSSasha Levin 	}
104637f3d50eSSasha Levin 
1047384922b3SPekka Enberg 	max_cpus = kvm__max_cpus(kvm);
10488259b8ccSSasha Levin 	recommended_cpus = kvm__recommended_cpus(kvm);
1049384922b3SPekka Enberg 
1050384922b3SPekka Enberg 	if (nrcpus > max_cpus) {
1051384922b3SPekka Enberg 		printf("  # Limit the number of CPUs to %d\n", max_cpus);
105290c05188SMatt Evans 		nrcpus = max_cpus;
10538259b8ccSSasha Levin 	} else if (nrcpus > recommended_cpus) {
10548259b8ccSSasha Levin 		printf("  # Warning: The maximum recommended amount of VCPUs"
10558259b8ccSSasha Levin 			" is %d\n", recommended_cpus);
1056384922b3SPekka Enberg 	}
1057384922b3SPekka Enberg 
10580c7c14a7SCyrill Gorcunov 	kvm->nrcpus = nrcpus;
10590c7c14a7SCyrill Gorcunov 
1060e2077857SMatt Evans 	/* Alloc one pointer too many, so array ends up 0-terminated */
1061e2077857SMatt Evans 	kvm_cpus = calloc(nrcpus + 1, sizeof(void *));
1062e2077857SMatt Evans 	if (!kvm_cpus)
1063e2077857SMatt Evans 		die("Couldn't allocate array for %d CPUs", nrcpus);
1064e2077857SMatt Evans 
1065e3c4f8aaSSasha Levin 	r = irq__init(kvm);
1066e3c4f8aaSSasha Levin 	if (r < 0) {
1067e3c4f8aaSSasha Levin 		pr_err("irq__init() failed with error %d\n", r);
1068e3c4f8aaSSasha Levin 		goto fail;
1069e3c4f8aaSSasha Levin 	}
107019e6c8b8SMatt Evans 
10716d987703SSasha Levin 	r = pci__init(kvm);
10726d987703SSasha Levin 	if (r < 0) {
10736d987703SSasha Levin 		pr_err("pci__init() failed with error %d\n", r);
10746d987703SSasha Levin 		goto fail;
10756d987703SSasha Levin 	}
1076b91be965SMatt Evans 
10777af40b91SSasha Levin 	r = ioport__init(kvm);
10787af40b91SSasha Levin 	if (r < 0) {
10797af40b91SSasha Levin 		pr_err("ioport__init() failed with error %d\n", r);
10807af40b91SSasha Levin 		goto fail;
10817af40b91SSasha Levin 	}
10827af40b91SSasha Levin 
1083890364f8SCyrill Gorcunov 	/*
1084890364f8SCyrill Gorcunov 	 * vidmode should be either specified
1085890364f8SCyrill Gorcunov 	 * either set by default
1086890364f8SCyrill Gorcunov 	 */
108747621338SSasha Levin 	if (kvm->cfg.vnc || kvm->cfg.sdl) {
1088890364f8SCyrill Gorcunov 		if (vidmode == -1)
1089890364f8SCyrill Gorcunov 			vidmode = 0x312;
109048d9e01aSSasha Levin 	} else {
1091890364f8SCyrill Gorcunov 		vidmode = 0;
109248d9e01aSSasha Levin 	}
1093890364f8SCyrill Gorcunov 
109426c853e4SPrasad Joshi 	memset(real_cmdline, 0, sizeof(real_cmdline));
109547621338SSasha Levin 	kvm__arch_set_cmdline(real_cmdline, kvm->cfg.vnc || kvm->cfg.sdl);
10968e704a7aSMatt Evans 
10978e704a7aSMatt Evans 	if (strlen(real_cmdline) > 0)
1098d74181ccSSasha Levin 		strcat(real_cmdline, " ");
10998e704a7aSMatt Evans 
110047621338SSasha Levin 	if (kvm->cfg.kernel_cmdline)
110147621338SSasha Levin 		strlcat(real_cmdline, kvm->cfg.kernel_cmdline, sizeof(real_cmdline));
110226c853e4SPrasad Joshi 
110347621338SSasha Levin 	if (!kvm->cfg.using_rootfs && !kvm->cfg.disk_image[0].filename && !kvm->cfg.initrd_filename) {
1104c8675741SSasha Levin 		char tmp[PATH_MAX];
11056df1471eSPekka Enberg 
110647621338SSasha Levin 		kvm_setup_create_new(kvm->cfg.custom_rootfs_name);
110747621338SSasha Levin 		kvm_setup_resolv(kvm->cfg.custom_rootfs_name);
1108c8675741SSasha Levin 
11099667701cSPekka Enberg 		snprintf(tmp, PATH_MAX, "%s%s", kvm__get_dir(), "default");
1110c8675741SSasha Levin 		if (virtio_9p__register(kvm, tmp, "/dev/root") < 0)
1111c8675741SSasha Levin 			die("Unable to initialize virtio 9p");
1112c8675741SSasha Levin 		if (virtio_9p__register(kvm, "/", "hostfs") < 0)
1113c8675741SSasha Levin 			die("Unable to initialize virtio 9p");
111447621338SSasha Levin 		kvm->cfg.using_rootfs = kvm->cfg.custom_rootfs = 1;
111526c853e4SPrasad Joshi 	}
111626c853e4SPrasad Joshi 
111747621338SSasha Levin 	if (kvm->cfg.using_rootfs) {
1118ff42603fSSasha Levin 		strcat(real_cmdline, " root=/dev/root rw rootflags=rw,trans=virtio,version=9p2000.L rootfstype=9p");
111947621338SSasha Levin 		if (kvm->cfg.custom_rootfs) {
1120d50fe489SSasha Levin 			kvm_run_set_sandbox();
1121d50fe489SSasha Levin 
1122a8e6b4b9SSasha Levin 			strcat(real_cmdline, " init=/virt/init");
1123d50fe489SSasha Levin 
112447621338SSasha Levin 			if (!kvm->cfg.no_dhcp)
1125a8e6b4b9SSasha Levin 				strcat(real_cmdline, "  ip=dhcp");
1126afc2c7c0SAsias He 			if (kvm_setup_guest_init())
1127afc2c7c0SAsias He 				die("Failed to setup init for guest.");
1128a8e6b4b9SSasha Levin 		}
112982d65b5eSSasha Levin 	} else if (!strstr(real_cmdline, "root=")) {
1130ff42603fSSasha Levin 		strlcat(real_cmdline, " root=/dev/vda rw ", sizeof(real_cmdline));
113182d65b5eSSasha Levin 	}
113259aa2d30SSasha Levin 
113347621338SSasha Levin 	if (kvm->cfg.image_count) {
113447621338SSasha Levin 		kvm->nr_disks = kvm->cfg.image_count;
113547621338SSasha Levin 		kvm->disks = disk_image__open_all((struct disk_image_params *)&kvm->cfg.disk_image, kvm->cfg.image_count);
11369f9207c5SSasha Levin 		if (IS_ERR(kvm->disks)) {
11379f9207c5SSasha Levin 			r = PTR_ERR(kvm->disks);
11389f9207c5SSasha Levin 			pr_err("disk_image__open_all() failed with error %ld\n",
11399f9207c5SSasha Levin 					PTR_ERR(kvm->disks));
11409f9207c5SSasha Levin 			goto fail;
11419f9207c5SSasha Levin 		}
1142f967c427SPrasad Joshi 	}
1143c1ed214eSPrasad Joshi 
1144ee8b1456SWanlong Gao 	printf("  # %s run -k %s -m %Lu -c %d --name %s\n", KVM_BINARY_NAME,
114547621338SSasha Levin 		kvm->cfg.kernel_filename, kvm->cfg.ram_size / 1024 / 1024, nrcpus, kvm->cfg.guest_name);
1146471c6facSPekka Enberg 
114747621338SSasha Levin 	if (!kvm->cfg.firmware_filename) {
114847621338SSasha Levin 		if (!kvm__load_kernel(kvm, kvm->cfg.kernel_filename,
114947621338SSasha Levin 				kvm->cfg.initrd_filename, real_cmdline, vidmode))
115047621338SSasha Levin 			die("unable to load kernel %s", kvm->cfg.kernel_filename);
1151f967c427SPrasad Joshi 
115247621338SSasha Levin 		kvm->vmlinux = kvm->cfg.vmlinux_filename;
1153807b77b9SCyrill Gorcunov 		r = symbol_init(kvm);
1154b56f1728SCyrill Gorcunov 		if (r < 0)
1155c4b716ecSPekka Enberg 			pr_debug("symbol_init() failed with error %d\n", r);
11565ad8db5eSPekka Enberg 	}
1157b0b42ba0SPekka Enberg 
1158af7b0868SMatt Evans 	ioport__setup_arch();
1159ac38f433SPekka Enberg 
116020c39545SSasha Levin 	r = rtc__init(kvm);
116120c39545SSasha Levin 	if (r < 0) {
116220c39545SSasha Levin 		pr_err("rtc__init() failed with error %d\n", r);
116320c39545SSasha Levin 		goto fail;
116420c39545SSasha Levin 	}
116564136c1cSPekka Enberg 
116620715a22SSasha Levin 	r = serial8250__init(kvm);
116720715a22SSasha Levin 	if (r < 0) {
116820715a22SSasha Levin 		pr_err("serial__init() failed with error %d\n", r);
116920715a22SSasha Levin 		goto fail;
117020715a22SSasha Levin 	}
1171f967c427SPrasad Joshi 
11729f9207c5SSasha Levin 	r = virtio_blk__init(kvm);
11739f9207c5SSasha Levin 	if (r < 0) {
11749f9207c5SSasha Levin 		pr_err("virtio_blk__init() failed with error %d\n", r);
11759f9207c5SSasha Levin 		goto fail;
11769f9207c5SSasha Levin 	}
11779f9207c5SSasha Levin 
1178a67da3beSAsias He 	r = virtio_scsi_init(kvm);
1179a67da3beSAsias He 	if (r < 0) {
1180a67da3beSAsias He 		pr_err("virtio_scsi_init() failed with error %d\n", r);
1181a67da3beSAsias He 		goto fail;
1182a67da3beSAsias He 	}
1183a67da3beSAsias He 
1184a67da3beSAsias He 
11851621292eSSasha Levin 	if (active_console == CONSOLE_VIRTIO)
1186f967c427SPrasad Joshi 		virtio_console__init(kvm);
1187f967c427SPrasad Joshi 
118847621338SSasha Levin 	if (kvm->cfg.virtio_rng)
118953eca082SSasha Levin 		virtio_rng__init(kvm);
119053eca082SSasha Levin 
119147621338SSasha Levin 	if (kvm->cfg.balloon)
119282d2f21eSSasha Levin 		virtio_bln__init(kvm);
119382d2f21eSSasha Levin 
119447621338SSasha Levin 	if (!kvm->cfg.network)
119547621338SSasha Levin 		kvm->cfg.network = DEFAULT_NETWORK;
11964f56d42cSAsias He 
1197c7838fbdSSasha Levin 	virtio_9p__init(kvm);
1198c7838fbdSSasha Levin 
119947621338SSasha Levin 	for (i = 0; i < kvm->cfg.num_net_devices; i++) {
120047621338SSasha Levin 		kvm->cfg.net_params[i].kvm = kvm;
120147621338SSasha Levin 		virtio_net__init(&kvm->cfg.net_params[i]);
12029a6d73f1SSasha Levin 	}
1203a4e724ddSSasha Levin 
120447621338SSasha Levin 	if (kvm->cfg.num_net_devices == 0 && kvm->cfg.no_net == 0) {
12059a6d73f1SSasha Levin 		struct virtio_net_params net_params;
12069a6d73f1SSasha Levin 
12079a6d73f1SSasha Levin 		net_params = (struct virtio_net_params) {
120847621338SSasha Levin 			.guest_ip	= kvm->cfg.guest_ip,
120947621338SSasha Levin 			.host_ip	= kvm->cfg.host_ip,
12109a6d73f1SSasha Levin 			.kvm		= kvm,
121147621338SSasha Levin 			.script		= kvm->cfg.script,
12129a6d73f1SSasha Levin 			.mode		= NET_MODE_USER,
12139a6d73f1SSasha Levin 		};
121447621338SSasha Levin 		str_to_mac(kvm->cfg.guest_mac, net_params.guest_mac);
121547621338SSasha Levin 		str_to_mac(kvm->cfg.host_mac, net_params.host_mac);
12169a6d73f1SSasha Levin 
1217bdfcfca6SSasha Levin 		virtio_net__init(&net_params);
1218bdfcfca6SSasha Levin 	}
12194f56d42cSAsias He 
1220839051d9SSasha Levin 	kvm__init_ram(kvm);
1221839051d9SSasha Levin 
122257d7832bSMatt Evans #ifdef CONFIG_X86
1223714e5b7fSSasha Levin 	kbd__init(kvm);
122457d7832bSMatt Evans #endif
1225714e5b7fSSasha Levin 
122695d13a52SSasha Levin 	pci_shmem__init(kvm);
122795d13a52SSasha Levin 
122847621338SSasha Levin 	if (kvm->cfg.vnc || kvm->cfg.sdl) {
12293f838fecSPekka Enberg 		fb = vesa__init(kvm);
123048d9e01aSSasha Levin 		if (IS_ERR(fb)) {
123148d9e01aSSasha Levin 			pr_err("vesa__init() failed with error %ld\n", PTR_ERR(fb));
123248d9e01aSSasha Levin 			goto fail;
123348d9e01aSSasha Levin 		}
12343f838fecSPekka Enberg 	}
12353f838fecSPekka Enberg 
123647621338SSasha Levin 	if (kvm->cfg.vnc && fb) {
123748d9e01aSSasha Levin 		r = vnc__init(fb);
123848d9e01aSSasha Levin 		if (r < 0) {
123948d9e01aSSasha Levin 			pr_err("vnc__init() failed with error %d\n", r);
124048d9e01aSSasha Levin 			goto fail;
124148d9e01aSSasha Levin 		}
124248d9e01aSSasha Levin 	}
124348d9e01aSSasha Levin 
124447621338SSasha Levin 	if (kvm->cfg.sdl && fb) {
12453f838fecSPekka Enberg 		sdl__init(fb);
124648d9e01aSSasha Levin 		if (r < 0) {
124748d9e01aSSasha Levin 			pr_err("sdl__init() failed with error %d\n", r);
124848d9e01aSSasha Levin 			goto fail;
124948d9e01aSSasha Levin 		}
12503f838fecSPekka Enberg 	}
1251aba1efa5SPekka Enberg 
125248d9e01aSSasha Levin 	r = fb__start();
125348d9e01aSSasha Levin 	if (r < 0) {
125448d9e01aSSasha Levin 		pr_err("fb__init() failed with error %d\n", r);
125548d9e01aSSasha Levin 		goto fail;
125648d9e01aSSasha Levin 	}
1257aba1efa5SPekka Enberg 
125825af47eeSMatt Evans 	/* Device init all done; firmware init must
125925af47eeSMatt Evans 	 * come after this (it may set up device trees etc.)
126025af47eeSMatt Evans 	 */
126125af47eeSMatt Evans 
126225af47eeSMatt Evans 	kvm__start_timer(kvm);
126325af47eeSMatt Evans 
126447621338SSasha Levin 	if (kvm->cfg.firmware_filename) {
126547621338SSasha Levin 		if (!kvm__load_firmware(kvm, kvm->cfg.firmware_filename))
126647621338SSasha Levin 			die("unable to load firmware image %s: %s", kvm->cfg.firmware_filename, strerror(errno));
12675ad8db5eSPekka Enberg 	} else {
1268e1e46fe6SSasha Levin 		kvm__arch_setup_firmware(kvm);
12691add9f73SSasha Levin 		if (r < 0) {
12701add9f73SSasha Levin 			pr_err("kvm__arch_setup_firmware() failed with error %d\n", r);
12711add9f73SSasha Levin 			goto fail;
12721add9f73SSasha Levin 		}
12735ad8db5eSPekka Enberg 	}
127425af47eeSMatt Evans 
127525af47eeSMatt Evans 	for (i = 0; i < nrcpus; i++) {
127625af47eeSMatt Evans 		kvm_cpus[i] = kvm_cpu__init(kvm, i);
127725af47eeSMatt Evans 		if (!kvm_cpus[i])
127825af47eeSMatt Evans 			die("unable to initialize KVM VCPU");
127925af47eeSMatt Evans 	}
128025af47eeSMatt Evans 
1281d60bafe5SSasha Levin 	thread_pool__init(nr_online_cpus);
12824932d174SSasha Levin fail:
12834932d174SSasha Levin 	return r;
1284e1e46fe6SSasha Levin }
1285e1e46fe6SSasha Levin 
1286e1e46fe6SSasha Levin static int kvm_cmd_run_work(void)
1287e1e46fe6SSasha Levin {
1288e1e46fe6SSasha Levin 	int i, r = -1;
1289e1e46fe6SSasha Levin 	void *ret = NULL;
1290e1e46fe6SSasha Levin 
1291839051d9SSasha Levin 	for (i = 0; i < nrcpus; i++) {
1292d77a9efaSCyrill Gorcunov 		if (pthread_create(&kvm_cpus[i]->thread, NULL, kvm_cpu_thread, kvm_cpus[i]) != 0)
12935ee154d1SPekka Enberg 			die("unable to create KVM VCPU thread");
12945ee154d1SPekka Enberg 	}
12955ee154d1SPekka Enberg 
129649e5227dSSasha Levin 	/* Only VCPU #0 is going to exit by itself when shutting down */
129749e5227dSSasha Levin 	if (pthread_join(kvm_cpus[0]->thread, &ret) != 0)
1298e1e46fe6SSasha Levin 		r = 0;
12995ee154d1SPekka Enberg 
130089e0575aSPekka Enberg 	kvm_cpu__delete(kvm_cpus[0]);
130120715a22SSasha Levin 	kvm_cpus[0] = NULL;
130289e0575aSPekka Enberg 
130349e5227dSSasha Levin 	for (i = 1; i < nrcpus; i++) {
1304c23d9748SSasha Levin 		if (kvm_cpus[i]->is_running) {
130549e5227dSSasha Levin 			pthread_kill(kvm_cpus[i]->thread, SIGKVMEXIT);
1306d77a9efaSCyrill Gorcunov 			if (pthread_join(kvm_cpus[i]->thread, &ret) != 0)
13075ee154d1SPekka Enberg 				die("pthread_join");
130889e0575aSPekka Enberg 			kvm_cpu__delete(kvm_cpus[i]);
1309c23d9748SSasha Levin 		}
1310e1e46fe6SSasha Levin 		if (ret == NULL)
1311e1e46fe6SSasha Levin 			r = 0;
13125ee154d1SPekka Enberg 	}
1313f967c427SPrasad Joshi 
1314e1e46fe6SSasha Levin 	return r;
1315e1e46fe6SSasha Levin }
1316e1e46fe6SSasha Levin 
13174932d174SSasha Levin static void kvm_cmd_run_exit(int guest_ret)
1318e1e46fe6SSasha Levin {
13194932d174SSasha Levin 	int r = 0;
13204932d174SSasha Levin 
1321e6694207SSasha Levin 	compat__print_all_messages();
1322e6694207SSasha Levin 
1323807b77b9SCyrill Gorcunov 	r = symbol_exit(kvm);
13244932d174SSasha Levin 	if (r < 0)
1325807b77b9SCyrill Gorcunov 		pr_warning("symbol_exit() failed with error %d\n", r);
13264932d174SSasha Levin 
1327e3c4f8aaSSasha Levin 	r = irq__exit(kvm);
1328e3c4f8aaSSasha Levin 	if (r < 0)
1329e3c4f8aaSSasha Levin 		pr_warning("irq__exit() failed with error %d\n", r);
1330e3c4f8aaSSasha Levin 
1331aba1efa5SPekka Enberg 	fb__stop();
1332aba1efa5SPekka Enberg 
1333a67da3beSAsias He 	r = virtio_scsi_exit(kvm);
1334a67da3beSAsias He 	if (r < 0)
1335a67da3beSAsias He 		pr_warning("virtio_scsi_exit() failed with error %d\n", r);
1336a67da3beSAsias He 
13379f9207c5SSasha Levin 	r = virtio_blk__exit(kvm);
13389f9207c5SSasha Levin 	if (r < 0)
13399f9207c5SSasha Levin 		pr_warning("virtio_blk__exit() failed with error %d\n", r);
13409f9207c5SSasha Levin 
1341495fbd4eSSasha Levin 	r = virtio_rng__exit(kvm);
1342495fbd4eSSasha Levin 	if (r < 0)
1343495fbd4eSSasha Levin 		pr_warning("virtio_rng__exit() failed with error %d\n", r);
1344a0a1e3c2SPrasad Joshi 
134547621338SSasha Levin 	r = disk_image__close_all(kvm->disks, kvm->cfg.image_count);
13469f9207c5SSasha Levin 	if (r < 0)
13479f9207c5SSasha Levin 		pr_warning("disk_image__close_all() failed with error %d\n", r);
13487af40b91SSasha Levin 
134920715a22SSasha Levin 	r = serial8250__exit(kvm);
135020715a22SSasha Levin 	if (r < 0)
135120715a22SSasha Levin 		pr_warning("serial8250__exit() failed with error %d\n", r);
135220715a22SSasha Levin 
135320c39545SSasha Levin 	r = rtc__exit(kvm);
135420c39545SSasha Levin 	if (r < 0)
135520c39545SSasha Levin 		pr_warning("rtc__exit() failed with error %d\n", r);
135620c39545SSasha Levin 
13571add9f73SSasha Levin 	r = kvm__arch_free_firmware(kvm);
13581add9f73SSasha Levin 	if (r < 0)
13591add9f73SSasha Levin 		pr_warning("kvm__arch_free_firmware() failed with error %d\n", r);
13601add9f73SSasha Levin 
13617af40b91SSasha Levin 	r = ioport__exit(kvm);
13627af40b91SSasha Levin 	if (r < 0)
13637af40b91SSasha Levin 		pr_warning("ioport__exit() failed with error %d\n", r);
13647af40b91SSasha Levin 
1365ea6eeb1cSSasha Levin 	r = ioeventfd__exit(kvm);
1366ea6eeb1cSSasha Levin 	if (r < 0)
1367ea6eeb1cSSasha Levin 		pr_warning("ioeventfd__exit() failed with error %d\n", r);
1368ea6eeb1cSSasha Levin 
13696d987703SSasha Levin 	r = pci__exit(kvm);
13706d987703SSasha Levin 	if (r < 0)
13716d987703SSasha Levin 		pr_warning("pci__exit() failed with error %d\n", r);
13726d987703SSasha Levin 
1373495fbd4eSSasha Levin 	r = kvm__exit(kvm);
1374495fbd4eSSasha Levin 	if (r < 0)
1375495fbd4eSSasha Levin 		pr_warning("pci__exit() failed with error %d\n", r);
1376f967c427SPrasad Joshi 
137749777800SPekka Enberg 	free(kvm_cpus);
137849777800SPekka Enberg 
1379e1e46fe6SSasha Levin 	if (guest_ret == 0)
1380f967c427SPrasad Joshi 		printf("\n  # KVM session ended normally.\n");
1381e1e46fe6SSasha Levin }
1382e1e46fe6SSasha Levin 
/*
 * Entry point of the "run" command: initialise, run the guest, tear down.
 *
 * A negative result from kvm_cmd_run_init() is returned right away, without
 * running the guest or the teardown. Otherwise the value produced by
 * kvm_cmd_run_work() is passed to kvm_cmd_run_exit() and then returned.
 * The prefix argument is not used here.
 */
int kvm_cmd_run(int argc, const char **argv, const char *prefix)
{
	int guest_status;
	int init_status = kvm_cmd_run_init(argc, argv);

	if (init_status < 0)
		return init_status;

	guest_status = kvm_cmd_run_work();
	kvm_cmd_run_exit(guest_status);

	return guest_status;
}
1396