xref: /kvmtool/builtin-run.c (revision 48d9e01a8cfb8541c32c1dd46fa9d34fc687b031)
1ece09f8fSPekka Enberg #include "kvm/builtin-run.h"
2ece09f8fSPekka Enberg 
3c8675741SSasha Levin #include "kvm/builtin-setup.h"
4ece09f8fSPekka Enberg #include "kvm/virtio-balloon.h"
5ece09f8fSPekka Enberg #include "kvm/virtio-console.h"
6ece09f8fSPekka Enberg #include "kvm/parse-options.h"
7ece09f8fSPekka Enberg #include "kvm/8250-serial.h"
8ece09f8fSPekka Enberg #include "kvm/framebuffer.h"
9ece09f8fSPekka Enberg #include "kvm/disk-image.h"
10ece09f8fSPekka Enberg #include "kvm/threadpool.h"
11ece09f8fSPekka Enberg #include "kvm/virtio-blk.h"
12ece09f8fSPekka Enberg #include "kvm/virtio-net.h"
13ece09f8fSPekka Enberg #include "kvm/virtio-rng.h"
14ece09f8fSPekka Enberg #include "kvm/ioeventfd.h"
15ece09f8fSPekka Enberg #include "kvm/virtio-9p.h"
16ece09f8fSPekka Enberg #include "kvm/barrier.h"
17ece09f8fSPekka Enberg #include "kvm/kvm-cpu.h"
18ece09f8fSPekka Enberg #include "kvm/ioport.h"
19ece09f8fSPekka Enberg #include "kvm/symbol.h"
20ece09f8fSPekka Enberg #include "kvm/i8042.h"
21ece09f8fSPekka Enberg #include "kvm/mutex.h"
22ece09f8fSPekka Enberg #include "kvm/term.h"
23ece09f8fSPekka Enberg #include "kvm/util.h"
24ec52d504SLai Jiangshan #include "kvm/strbuf.h"
25ece09f8fSPekka Enberg #include "kvm/vesa.h"
26ece09f8fSPekka Enberg #include "kvm/irq.h"
27ece09f8fSPekka Enberg #include "kvm/kvm.h"
28ece09f8fSPekka Enberg #include "kvm/pci.h"
29ece09f8fSPekka Enberg #include "kvm/rtc.h"
30ece09f8fSPekka Enberg #include "kvm/sdl.h"
31ece09f8fSPekka Enberg #include "kvm/vnc.h"
32e6694207SSasha Levin #include "kvm/guest_compat.h"
3395d13a52SSasha Levin #include "kvm/pci-shmem.h"
344b1addaeSSasha Levin #include "kvm/kvm-ipc.h"
354b1c6f6eSSasha Levin #include "kvm/builtin-debug.h"
36ece09f8fSPekka Enberg 
37ece09f8fSPekka Enberg #include <linux/types.h>
38*48d9e01aSSasha Levin #include <linux/err.h>
39ece09f8fSPekka Enberg 
408329f30bSPekka Enberg #include <sys/utsname.h>
418329f30bSPekka Enberg #include <sys/types.h>
428329f30bSPekka Enberg #include <sys/stat.h>
43ece09f8fSPekka Enberg #include <termios.h>
44ece09f8fSPekka Enberg #include <signal.h>
45ece09f8fSPekka Enberg #include <stdlib.h>
46ece09f8fSPekka Enberg #include <string.h>
47ece09f8fSPekka Enberg #include <unistd.h>
4826c853e4SPrasad Joshi #include <ctype.h>
49ece09f8fSPekka Enberg #include <stdio.h>
50f967c427SPrasad Joshi 
/* Built-in defaults used when the matching command-line option is absent. */
#define DEFAULT_KVM_DEV		"/dev/kvm"
#define DEFAULT_CONSOLE		"serial"
#define DEFAULT_NETWORK		"user"
#define DEFAULT_HOST_ADDR	"192.168.33.1"
#define DEFAULT_GUEST_ADDR	"192.168.33.15"
#define DEFAULT_GUEST_MAC	"02:15:15:15:15:15"
#define DEFAULT_HOST_MAC	"02:01:01:01:01:01"
#define DEFAULT_SCRIPT		"none"
const char *DEFAULT_SANDBOX_FILENAME = "guest/sandbox.sh";

/* Shift counts converting a value in KiB/MiB/GiB into bytes. */
#define KB_SHIFT		(10)
#define MB_SHIFT		(20)
#define GB_SHIFT		(30)

/* Smallest guest RAM size, expressed in MiB and in bytes. */
#define MIN_RAM_SIZE_MB		(64ULL)
#define MIN_RAM_SIZE_BYTE	(MIN_RAM_SIZE_MB << MB_SHIFT)
66f967c427SPrasad Joshi 
674298ddadSSasha Levin struct kvm *kvm;
68e2077857SMatt Evans struct kvm_cpu **kvm_cpus;
69656be1b8SSasha Levin __thread struct kvm_cpu *current_kvm_cpu;
70f967c427SPrasad Joshi 
71fd834defSPekka Enberg static u64 ram_size;
72a33979d8SSasha Levin static u8  image_count;
739a6d73f1SSasha Levin static u8 num_net_devices;
74cf55d6aeSLiming Wang static bool virtio_rng;
75f967c427SPrasad Joshi static const char *kernel_cmdline;
76f967c427SPrasad Joshi static const char *kernel_filename;
77b0b42ba0SPekka Enberg static const char *vmlinux_filename;
78f967c427SPrasad Joshi static const char *initrd_filename;
79a33979d8SSasha Levin static const char *image_filename[MAX_DISK_IMAGES];
809aa4a0ebSAsias He static const char *console;
815929637bSAsias He static const char *dev;
824f56d42cSAsias He static const char *network;
83e80ddf6aSAsias He static const char *host_ip;
84bb8ffd2fSAsias He static const char *guest_ip;
85a4e724ddSSasha Levin static const char *guest_mac;
86d7098b9bSAsias He static const char *host_mac;
8773b7d038SAmos Kong static const char *script;
885358b0e6SSasha Levin static const char *guest_name;
89d50fe489SSasha Levin static const char *sandbox;
9061061257SMatt Evans static const char *hugetlbfs_path;
91cb540c93SSasha Levin static const char *custom_rootfs_name = "default";
929a6d73f1SSasha Levin static struct virtio_net_params *net_params;
930ea58e5bSPekka Enberg static bool single_step;
94a33979d8SSasha Levin static bool readonly_image[MAX_DISK_IMAGES];
955ffd4178SJohn Floren static bool vnc;
963f838fecSPekka Enberg static bool sdl;
9782d2f21eSSasha Levin static bool balloon;
9859aa2d30SSasha Levin static bool using_rootfs;
9982d65b5eSSasha Levin static bool custom_rootfs;
1009a6d73f1SSasha Levin static bool no_net;
101a8e6b4b9SSasha Levin static bool no_dhcp;
102f967c427SPrasad Joshi extern bool ioport_debug;
1033c29e2aaSSasha Levin static int  kvm_run_wrapper;
104f967c427SPrasad Joshi extern int  active_console;
105aa400b00SPrasad Joshi extern int  debug_iodelay;
106f967c427SPrasad Joshi 
107ed036f03SCyrill Gorcunov bool do_debug_print = false;
108ed036f03SCyrill Gorcunov 
109cfd63bbbSSasha Levin static int nrcpus;
110890364f8SCyrill Gorcunov static int vidmode = -1;
111d77a9efaSCyrill Gorcunov 
/* NULL-terminated usage lines for the "run" sub-command. */
static const char * const run_usage[] = {
	"lkvm run [<options>] [<kernel image>]",
	NULL,
};
116f967c427SPrasad Joshi 
/* Values stored in kvm_run_wrapper to select how "run" was invoked. */
enum {
	KVM_RUN_DEFAULT = 0,
	KVM_RUN_SANDBOX = 1,
};
1213c29e2aaSSasha Levin 
1223c29e2aaSSasha Levin void kvm_run_set_wrapper_sandbox(void)
1233c29e2aaSSasha Levin {
1243c29e2aaSSasha Levin 	kvm_run_wrapper = KVM_RUN_SANDBOX;
1253c29e2aaSSasha Levin }
1263c29e2aaSSasha Levin 
127a33979d8SSasha Levin static int img_name_parser(const struct option *opt, const char *arg, int unset)
128a33979d8SSasha Levin {
129a33979d8SSasha Levin 	char *sep;
13059aa2d30SSasha Levin 	struct stat st;
13182d65b5eSSasha Levin 	char path[PATH_MAX];
13259aa2d30SSasha Levin 
13359aa2d30SSasha Levin 	if (stat(arg, &st) == 0 &&
13459aa2d30SSasha Levin 	    S_ISDIR(st.st_mode)) {
13559aa2d30SSasha Levin 		char tmp[PATH_MAX];
13659aa2d30SSasha Levin 
1372c908af9SLai Jiangshan 		if (using_rootfs)
1382c908af9SLai Jiangshan 			die("Please use only one rootfs directory atmost");
1392c908af9SLai Jiangshan 
14059aa2d30SSasha Levin 		if (realpath(arg, tmp) == 0 ||
141c7838fbdSSasha Levin 		    virtio_9p__register(kvm, tmp, "/dev/root") < 0)
14259aa2d30SSasha Levin 			die("Unable to initialize virtio 9p");
14359aa2d30SSasha Levin 		using_rootfs = 1;
14459aa2d30SSasha Levin 		return 0;
14559aa2d30SSasha Levin 	}
146a33979d8SSasha Levin 
1479667701cSPekka Enberg 	snprintf(path, PATH_MAX, "%s%s", kvm__get_dir(), arg);
14882d65b5eSSasha Levin 
14982d65b5eSSasha Levin 	if (stat(path, &st) == 0 &&
15082d65b5eSSasha Levin 	    S_ISDIR(st.st_mode)) {
15182d65b5eSSasha Levin 		char tmp[PATH_MAX];
15282d65b5eSSasha Levin 
1532c908af9SLai Jiangshan 		if (using_rootfs)
1542c908af9SLai Jiangshan 			die("Please use only one rootfs directory atmost");
1552c908af9SLai Jiangshan 
15682d65b5eSSasha Levin 		if (realpath(path, tmp) == 0 ||
15782d65b5eSSasha Levin 		    virtio_9p__register(kvm, tmp, "/dev/root") < 0)
15882d65b5eSSasha Levin 			die("Unable to initialize virtio 9p");
15982d65b5eSSasha Levin 		if (virtio_9p__register(kvm, "/", "hostfs") < 0)
16082d65b5eSSasha Levin 			die("Unable to initialize virtio 9p");
16169c88b95SSasha Levin 		kvm_setup_resolv(arg);
16282d65b5eSSasha Levin 		using_rootfs = custom_rootfs = 1;
163cb540c93SSasha Levin 		custom_rootfs_name = arg;
16482d65b5eSSasha Levin 		return 0;
16582d65b5eSSasha Levin 	}
16682d65b5eSSasha Levin 
167a33979d8SSasha Levin 	if (image_count >= MAX_DISK_IMAGES)
168a33979d8SSasha Levin 		die("Currently only 4 images are supported");
169a33979d8SSasha Levin 
170a33979d8SSasha Levin 	image_filename[image_count] = arg;
171a33979d8SSasha Levin 	sep = strstr(arg, ",");
172a33979d8SSasha Levin 	if (sep) {
173a33979d8SSasha Levin 		if (strcmp(sep + 1, "ro") == 0)
174a33979d8SSasha Levin 			readonly_image[image_count] = 1;
175a33979d8SSasha Levin 		*sep = 0;
176a33979d8SSasha Levin 	}
177a33979d8SSasha Levin 
178a33979d8SSasha Levin 	image_count++;
179a33979d8SSasha Levin 
180a33979d8SSasha Levin 	return 0;
181a33979d8SSasha Levin }
182a33979d8SSasha Levin 
183b4422bf3SAneesh Kumar K.V static int virtio_9p_rootdir_parser(const struct option *opt, const char *arg, int unset)
184b4422bf3SAneesh Kumar K.V {
185b4422bf3SAneesh Kumar K.V 	char *tag_name;
186b4422bf3SAneesh Kumar K.V 	char tmp[PATH_MAX];
187b4422bf3SAneesh Kumar K.V 
188b4422bf3SAneesh Kumar K.V 	/*
189b4422bf3SAneesh Kumar K.V 	 * 9p dir can be of the form dirname,tag_name or
190b4422bf3SAneesh Kumar K.V 	 * just dirname. In the later case we use the
191b4422bf3SAneesh Kumar K.V 	 * default tag name
192b4422bf3SAneesh Kumar K.V 	 */
193b4422bf3SAneesh Kumar K.V 	tag_name = strstr(arg, ",");
194b4422bf3SAneesh Kumar K.V 	if (tag_name) {
195b4422bf3SAneesh Kumar K.V 		*tag_name = '\0';
196b4422bf3SAneesh Kumar K.V 		tag_name++;
197b4422bf3SAneesh Kumar K.V 	}
19854f6802dSPekka Enberg 	if (realpath(arg, tmp)) {
199c7838fbdSSasha Levin 		if (virtio_9p__register(kvm, tmp, tag_name) < 0)
20054f6802dSPekka Enberg 			die("Unable to initialize virtio 9p");
20154f6802dSPekka Enberg 	} else
202b4422bf3SAneesh Kumar K.V 		die("Failed resolving 9p path");
203b4422bf3SAneesh Kumar K.V 	return 0;
204b4422bf3SAneesh Kumar K.V }
205b4422bf3SAneesh Kumar K.V 
/*
 * Option callback for --tty: converts @arg with atoi() and passes the
 * resulting tty id to term_set_tty(). Always returns 0.
 */
static int tty_parser(const struct option *opt, const char *arg, int unset)
{
	term_set_tty(atoi(arg));

	return 0;
}
2141add4b76SSasha Levin 
/*
 * Parse a MAC address written as six colon-separated hex octets
 * ("02:15:15:15:15:15") from @str into the 6-byte buffer @mac.
 *
 * The octets are parsed into a scratch buffer first and copied out only
 * when all six were read, so a malformed string leaves @mac untouched
 * rather than partially overwritten.
 */
static inline void str_to_mac(const char *str, char *mac)
{
	unsigned char octets[6];
	int parsed;

	parsed = sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
			&octets[0], &octets[1], &octets[2],
			&octets[3], &octets[4], &octets[5]);
	if (parsed != 6)
		return;

	memcpy(mac, octets, sizeof(octets));
}
2209a6d73f1SSasha Levin static int set_net_param(struct virtio_net_params *p, const char *param,
2219a6d73f1SSasha Levin 				const char *val)
2229a6d73f1SSasha Levin {
2239a6d73f1SSasha Levin 	if (strcmp(param, "guest_mac") == 0) {
2249a6d73f1SSasha Levin 		str_to_mac(val, p->guest_mac);
2259a6d73f1SSasha Levin 	} else if (strcmp(param, "mode") == 0) {
2269a6d73f1SSasha Levin 		if (!strncmp(val, "user", 4)) {
2279a6d73f1SSasha Levin 			int i;
2289a6d73f1SSasha Levin 
2299a6d73f1SSasha Levin 			for (i = 0; i < num_net_devices; i++)
2309a6d73f1SSasha Levin 				if (net_params[i].mode == NET_MODE_USER)
2319a6d73f1SSasha Levin 					die("Only one usermode network device allowed at a time");
2329a6d73f1SSasha Levin 			p->mode = NET_MODE_USER;
2339a6d73f1SSasha Levin 		} else if (!strncmp(val, "tap", 3)) {
2349a6d73f1SSasha Levin 			p->mode = NET_MODE_TAP;
2359a6d73f1SSasha Levin 		} else if (!strncmp(val, "none", 4)) {
2369a6d73f1SSasha Levin 			no_net = 1;
2379a6d73f1SSasha Levin 			return -1;
2389a6d73f1SSasha Levin 		} else
2399a6d73f1SSasha Levin 			die("Unkown network mode %s, please use user, tap or none", network);
2409a6d73f1SSasha Levin 	} else if (strcmp(param, "script") == 0) {
2419a6d73f1SSasha Levin 		p->script = strdup(val);
2429a6d73f1SSasha Levin 	} else if (strcmp(param, "guest_ip") == 0) {
2439a6d73f1SSasha Levin 		p->guest_ip = strdup(val);
2449a6d73f1SSasha Levin 	} else if (strcmp(param, "host_ip") == 0) {
2459a6d73f1SSasha Levin 		p->host_ip = strdup(val);
2469ed67cdcSSasha Levin 	} else if (strcmp(param, "vhost") == 0) {
2479ed67cdcSSasha Levin 		p->vhost = atoi(val);
248f19edd1eSSasha Levin 	} else if (strcmp(param, "fd") == 0) {
249f19edd1eSSasha Levin 		p->fd = atoi(val);
2509a6d73f1SSasha Levin 	}
2519a6d73f1SSasha Levin 
2529a6d73f1SSasha Levin 	return 0;
2539a6d73f1SSasha Levin }
2549a6d73f1SSasha Levin 
2559a6d73f1SSasha Levin static int netdev_parser(const struct option *opt, const char *arg, int unset)
2569a6d73f1SSasha Levin {
2579a6d73f1SSasha Levin 	struct virtio_net_params p;
2589a6d73f1SSasha Levin 	char *buf = NULL, *cmd = NULL, *cur = NULL;
2599a6d73f1SSasha Levin 	bool on_cmd = true;
2609a6d73f1SSasha Levin 
2619a6d73f1SSasha Levin 	if (arg) {
2629a6d73f1SSasha Levin 		buf = strdup(arg);
2639a6d73f1SSasha Levin 		if (buf == NULL)
2649a6d73f1SSasha Levin 			die("Failed allocating new net buffer");
2659a6d73f1SSasha Levin 		cur = strtok(buf, ",=");
2669a6d73f1SSasha Levin 	}
2679a6d73f1SSasha Levin 
2689a6d73f1SSasha Levin 	p = (struct virtio_net_params) {
2699a6d73f1SSasha Levin 		.guest_ip	= DEFAULT_GUEST_ADDR,
2709a6d73f1SSasha Levin 		.host_ip	= DEFAULT_HOST_ADDR,
2719a6d73f1SSasha Levin 		.script		= DEFAULT_SCRIPT,
2729a6d73f1SSasha Levin 		.mode		= NET_MODE_TAP,
2739a6d73f1SSasha Levin 	};
2749a6d73f1SSasha Levin 
2759a6d73f1SSasha Levin 	str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac);
2769a6d73f1SSasha Levin 	p.guest_mac[5] += num_net_devices;
2779a6d73f1SSasha Levin 
2789a6d73f1SSasha Levin 	while (cur) {
2799a6d73f1SSasha Levin 		if (on_cmd) {
2809a6d73f1SSasha Levin 			cmd = cur;
2819a6d73f1SSasha Levin 		} else {
2829a6d73f1SSasha Levin 			if (set_net_param(&p, cmd, cur) < 0)
2839a6d73f1SSasha Levin 				goto done;
2849a6d73f1SSasha Levin 		}
2859a6d73f1SSasha Levin 		on_cmd = !on_cmd;
2869a6d73f1SSasha Levin 
2879a6d73f1SSasha Levin 		cur = strtok(NULL, ",=");
2889a6d73f1SSasha Levin 	};
2899a6d73f1SSasha Levin 
2909a6d73f1SSasha Levin 	num_net_devices++;
2919a6d73f1SSasha Levin 
2929a6d73f1SSasha Levin 	net_params = realloc(net_params, num_net_devices * sizeof(*net_params));
2939a6d73f1SSasha Levin 	if (net_params == NULL)
2949a6d73f1SSasha Levin 		die("Failed adding new network device");
2959a6d73f1SSasha Levin 
2969a6d73f1SSasha Levin 	net_params[num_net_devices - 1] = p;
2979a6d73f1SSasha Levin 
2989a6d73f1SSasha Levin done:
2999a6d73f1SSasha Levin 	free(buf);
3009a6d73f1SSasha Levin 	return 0;
3019a6d73f1SSasha Levin }
3029a6d73f1SSasha Levin 
30395d13a52SSasha Levin static int shmem_parser(const struct option *opt, const char *arg, int unset)
30495d13a52SSasha Levin {
30572f1ad6dSSasha Levin 	const u64 default_size = SHMEM_DEFAULT_SIZE;
30672f1ad6dSSasha Levin 	const u64 default_phys_addr = SHMEM_DEFAULT_ADDR;
30795d13a52SSasha Levin 	const char *default_handle = SHMEM_DEFAULT_HANDLE;
30895d13a52SSasha Levin 	struct shmem_info *si = malloc(sizeof(struct shmem_info));
30972f1ad6dSSasha Levin 	u64 phys_addr;
31072f1ad6dSSasha Levin 	u64 size;
31195d13a52SSasha Levin 	char *handle = NULL;
31295d13a52SSasha Levin 	int create = 0;
31395d13a52SSasha Levin 	const char *p = arg;
31495d13a52SSasha Levin 	char *next;
31595d13a52SSasha Levin 	int base = 10;
31695d13a52SSasha Levin 	int verbose = 0;
31795d13a52SSasha Levin 
31895d13a52SSasha Levin 	const int skip_pci = strlen("pci:");
31995d13a52SSasha Levin 	if (verbose)
32095d13a52SSasha Levin 		pr_info("shmem_parser(%p,%s,%d)", opt, arg, unset);
32195d13a52SSasha Levin 	/* parse out optional addr family */
32295d13a52SSasha Levin 	if (strcasestr(p, "pci:")) {
32395d13a52SSasha Levin 		p += skip_pci;
32495d13a52SSasha Levin 	} else if (strcasestr(p, "mem:")) {
32595d13a52SSasha Levin 		die("I can't add to E820 map yet.\n");
32695d13a52SSasha Levin 	}
32795d13a52SSasha Levin 	/* parse out physical addr */
32895d13a52SSasha Levin 	base = 10;
32995d13a52SSasha Levin 	if (strcasestr(p, "0x"))
33095d13a52SSasha Levin 		base = 16;
33195d13a52SSasha Levin 	phys_addr = strtoll(p, &next, base);
33295d13a52SSasha Levin 	if (next == p && phys_addr == 0) {
33395d13a52SSasha Levin 		pr_info("shmem: no physical addr specified, using default.");
33495d13a52SSasha Levin 		phys_addr = default_phys_addr;
33595d13a52SSasha Levin 	}
33695d13a52SSasha Levin 	if (*next != ':' && *next != '\0')
33795d13a52SSasha Levin 		die("shmem: unexpected chars after phys addr.\n");
33895d13a52SSasha Levin 	if (*next == '\0')
33995d13a52SSasha Levin 		p = next;
34095d13a52SSasha Levin 	else
34195d13a52SSasha Levin 		p = next + 1;
34295d13a52SSasha Levin 	/* parse out size */
34395d13a52SSasha Levin 	base = 10;
34495d13a52SSasha Levin 	if (strcasestr(p, "0x"))
34595d13a52SSasha Levin 		base = 16;
34695d13a52SSasha Levin 	size = strtoll(p, &next, base);
34795d13a52SSasha Levin 	if (next == p && size == 0) {
34895d13a52SSasha Levin 		pr_info("shmem: no size specified, using default.");
34995d13a52SSasha Levin 		size = default_size;
35095d13a52SSasha Levin 	}
35195d13a52SSasha Levin 	/* look for [KMGkmg][Bb]*  uses base 2. */
35295d13a52SSasha Levin 	int skip_B = 0;
35395d13a52SSasha Levin 	if (strspn(next, "KMGkmg")) {	/* might have a prefix */
35495d13a52SSasha Levin 		if (*(next + 1) == 'B' || *(next + 1) == 'b')
35595d13a52SSasha Levin 			skip_B = 1;
35695d13a52SSasha Levin 		switch (*next) {
35795d13a52SSasha Levin 		case 'K':
35895d13a52SSasha Levin 		case 'k':
35995d13a52SSasha Levin 			size = size << KB_SHIFT;
36095d13a52SSasha Levin 			break;
36195d13a52SSasha Levin 		case 'M':
36295d13a52SSasha Levin 		case 'm':
36395d13a52SSasha Levin 			size = size << MB_SHIFT;
36495d13a52SSasha Levin 			break;
36595d13a52SSasha Levin 		case 'G':
36695d13a52SSasha Levin 		case 'g':
36795d13a52SSasha Levin 			size = size << GB_SHIFT;
36895d13a52SSasha Levin 			break;
36995d13a52SSasha Levin 		default:
37095d13a52SSasha Levin 			die("shmem: bug in detecting size prefix.");
37195d13a52SSasha Levin 			break;
37295d13a52SSasha Levin 		}
37395d13a52SSasha Levin 		next += 1 + skip_B;
37495d13a52SSasha Levin 	}
37595d13a52SSasha Levin 	if (*next != ':' && *next != '\0') {
37695d13a52SSasha Levin 		die("shmem: unexpected chars after phys size. <%c><%c>\n",
37795d13a52SSasha Levin 		    *next, *p);
37895d13a52SSasha Levin 	}
37995d13a52SSasha Levin 	if (*next == '\0')
38095d13a52SSasha Levin 		p = next;
38195d13a52SSasha Levin 	else
38295d13a52SSasha Levin 		p = next + 1;
38395d13a52SSasha Levin 	/* parse out optional shmem handle */
38495d13a52SSasha Levin 	const int skip_handle = strlen("handle=");
38595d13a52SSasha Levin 	next = strcasestr(p, "handle=");
38695d13a52SSasha Levin 	if (*p && next) {
38795d13a52SSasha Levin 		if (p != next)
38895d13a52SSasha Levin 			die("unexpected chars before handle\n");
38995d13a52SSasha Levin 		p += skip_handle;
39095d13a52SSasha Levin 		next = strchrnul(p, ':');
39195d13a52SSasha Levin 		if (next - p) {
39295d13a52SSasha Levin 			handle = malloc(next - p + 1);
39395d13a52SSasha Levin 			strncpy(handle, p, next - p);
39495d13a52SSasha Levin 			handle[next - p] = '\0';	/* just in case. */
39595d13a52SSasha Levin 		}
39695d13a52SSasha Levin 		if (*next == '\0')
39795d13a52SSasha Levin 			p = next;
39895d13a52SSasha Levin 		else
39995d13a52SSasha Levin 			p = next + 1;
40095d13a52SSasha Levin 	}
40195d13a52SSasha Levin 	/* parse optional create flag to see if we should create shm seg. */
40295d13a52SSasha Levin 	if (*p && strcasestr(p, "create")) {
40395d13a52SSasha Levin 		create = 1;
40495d13a52SSasha Levin 		p += strlen("create");
40595d13a52SSasha Levin 	}
40695d13a52SSasha Levin 	if (*p != '\0')
40795d13a52SSasha Levin 		die("shmem: unexpected trailing chars\n");
40895d13a52SSasha Levin 	if (handle == NULL) {
40995d13a52SSasha Levin 		handle = malloc(strlen(default_handle) + 1);
41095d13a52SSasha Levin 		strcpy(handle, default_handle);
41195d13a52SSasha Levin 	}
41295d13a52SSasha Levin 	if (verbose) {
41372f1ad6dSSasha Levin 		pr_info("shmem: phys_addr = %llx", phys_addr);
41472f1ad6dSSasha Levin 		pr_info("shmem: size      = %llx", size);
41595d13a52SSasha Levin 		pr_info("shmem: handle    = %s", handle);
41695d13a52SSasha Levin 		pr_info("shmem: create    = %d", create);
41795d13a52SSasha Levin 	}
41895d13a52SSasha Levin 
41995d13a52SSasha Levin 	si->phys_addr = phys_addr;
42095d13a52SSasha Levin 	si->size = size;
42195d13a52SSasha Levin 	si->handle = handle;
42295d13a52SSasha Levin 	si->create = create;
42395d13a52SSasha Levin 	pci_shmem__register_mem(si);	/* ownership of si, etc. passed on. */
42495d13a52SSasha Levin 	return 0;
42595d13a52SSasha Levin }
426b4422bf3SAneesh Kumar K.V 
427f967c427SPrasad Joshi static const struct option options[] = {
4285e3af62dSSasha Levin 	OPT_GROUP("Basic options:"),
4295358b0e6SSasha Levin 	OPT_STRING('\0', "name", &guest_name, "guest name",
4305358b0e6SSasha Levin 			"A name for the guest"),
43180b1f72fSPekka Enberg 	OPT_INTEGER('c', "cpus", &nrcpus, "Number of CPUs"),
432f967c427SPrasad Joshi 	OPT_U64('m', "mem", &ram_size, "Virtual machine memory size in MiB."),
43395d13a52SSasha Levin 	OPT_CALLBACK('\0', "shmem", NULL,
43495d13a52SSasha Levin 		     "[pci:]<addr>:<size>[:handle=<handle>][:create]",
43595d13a52SSasha Levin 		     "Share host shmem with guest via pci device",
43695d13a52SSasha Levin 		     shmem_parser),
437cadb9ab7SAsias He 	OPT_CALLBACK('d', "disk", NULL, "image or rootfs_dir", "Disk image or rootfs directory", img_name_parser),
43882d2f21eSSasha Levin 	OPT_BOOLEAN('\0', "balloon", &balloon, "Enable virtio balloon"),
4395ffd4178SJohn Floren 	OPT_BOOLEAN('\0', "vnc", &vnc, "Enable VNC framebuffer"),
4403f838fecSPekka Enberg 	OPT_BOOLEAN('\0', "sdl", &sdl, "Enable SDL framebuffer"),
441cf55d6aeSLiming Wang 	OPT_BOOLEAN('\0', "rng", &virtio_rng, "Enable virtio Random Number Generator"),
4428b7565e8SAsias He 	OPT_CALLBACK('\0', "9p", NULL, "dir_to_share,tag_name",
4438b7565e8SAsias He 		     "Enable virtio 9p to share files between host and guest", virtio_9p_rootdir_parser),
4443bbc49b6SMatt Evans 	OPT_STRING('\0', "console", &console, "serial, virtio or hv",
4458b7565e8SAsias He 			"Console to use"),
4468b7565e8SAsias He 	OPT_STRING('\0', "dev", &dev, "device_file", "KVM device file"),
4471add4b76SSasha Levin 	OPT_CALLBACK('\0', "tty", NULL, "tty id",
4481add4b76SSasha Levin 		     "Remap guest TTY into a pty on the host",
4491add4b76SSasha Levin 		     tty_parser),
450d50fe489SSasha Levin 	OPT_STRING('\0', "sandbox", &sandbox, "script",
451d50fe489SSasha Levin 			"Run this script when booting into custom rootfs"),
45261061257SMatt Evans 	OPT_STRING('\0', "hugetlbfs", &hugetlbfs_path, "path", "Hugetlbfs path"),
4535e3af62dSSasha Levin 
4545e3af62dSSasha Levin 	OPT_GROUP("Kernel options:"),
4555e3af62dSSasha Levin 	OPT_STRING('k', "kernel", &kernel_filename, "kernel",
4565e3af62dSSasha Levin 			"Kernel to boot in virtual machine"),
457d6c19027SAsias He 	OPT_STRING('i', "initrd", &initrd_filename, "initrd",
4585e3af62dSSasha Levin 			"Initial RAM disk image"),
4595e3af62dSSasha Levin 	OPT_STRING('p', "params", &kernel_cmdline, "params",
4605e3af62dSSasha Levin 			"Kernel command line arguments"),
4615e3af62dSSasha Levin 
4624d67c820SSasha Levin 	OPT_GROUP("Networking options:"),
4639a6d73f1SSasha Levin 	OPT_CALLBACK_DEFAULT('n', "network", NULL, "network params",
4649a6d73f1SSasha Levin 		     "Create a new guest NIC",
4659a6d73f1SSasha Levin 		     netdev_parser, NULL),
466a8e6b4b9SSasha Levin 	OPT_BOOLEAN('\0', "no-dhcp", &no_dhcp, "Disable kernel DHCP in rootfs mode"),
467d6c19027SAsias He 
468890364f8SCyrill Gorcunov 	OPT_GROUP("BIOS options:"),
469890364f8SCyrill Gorcunov 	OPT_INTEGER('\0', "vidmode", &vidmode,
470890364f8SCyrill Gorcunov 		    "Video mode"),
471890364f8SCyrill Gorcunov 
4725e3af62dSSasha Levin 	OPT_GROUP("Debug options:"),
473ed036f03SCyrill Gorcunov 	OPT_BOOLEAN('\0', "debug", &do_debug_print,
474ed036f03SCyrill Gorcunov 			"Enable debug messages"),
475d6c19027SAsias He 	OPT_BOOLEAN('\0', "debug-single-step", &single_step,
476d6c19027SAsias He 			"Enable single stepping"),
477001690a4SSasha Levin 	OPT_BOOLEAN('\0', "debug-ioport", &ioport_debug,
478d6c19027SAsias He 			"Enable ioport debugging"),
479001690a4SSasha Levin 	OPT_INTEGER('\0', "debug-iodelay", &debug_iodelay,
480aa400b00SPrasad Joshi 			"Delay IO by millisecond"),
481f967c427SPrasad Joshi 	OPT_END()
482f967c427SPrasad Joshi };
483f967c427SPrasad Joshi 
484b5b501ccSIngo Molnar /*
485b5b501ccSIngo Molnar  * Serialize debug printout so that the output of multiple vcpus does not
486b5b501ccSIngo Molnar  * get mixed up:
487b5b501ccSIngo Molnar  */
488cffeab25SIngo Molnar static int printout_done;
489b5b501ccSIngo Molnar 
49043119af7SPekka Enberg static void handle_sigusr1(int sig)
49143119af7SPekka Enberg {
49243119af7SPekka Enberg 	struct kvm_cpu *cpu = current_kvm_cpu;
493b7d2f013SSasha Levin 	int fd = kvm_cpu__get_debug_fd();
49443119af7SPekka Enberg 
4954b1c6f6eSSasha Levin 	if (!cpu || cpu->needs_nmi)
49643119af7SPekka Enberg 		return;
49743119af7SPekka Enberg 
498b7d2f013SSasha Levin 	dprintf(fd, "\n #\n # vCPU #%ld's dump:\n #\n", cpu->cpu_id);
49943119af7SPekka Enberg 	kvm_cpu__show_registers(cpu);
50043119af7SPekka Enberg 	kvm_cpu__show_code(cpu);
50143119af7SPekka Enberg 	kvm_cpu__show_page_tables(cpu);
502b5b501ccSIngo Molnar 	fflush(stdout);
503cffeab25SIngo Molnar 	printout_done = 1;
504cffeab25SIngo Molnar 	mb();
50543119af7SPekka Enberg }
50643119af7SPekka Enberg 
507d94e22b9SSasha Levin /* Pause/resume the guest using SIGUSR2 */
508d94e22b9SSasha Levin static int is_paused;
509d94e22b9SSasha Levin 
5104b1addaeSSasha Levin static void handle_pause(int fd, u32 type, u32 len, u8 *msg)
511d94e22b9SSasha Levin {
5125aa502e4SLai Jiangshan 	if (WARN_ON(len))
5135aa502e4SLai Jiangshan 		return;
5145aa502e4SLai Jiangshan 
5157021c50bSAsias He 	if (type == KVM_IPC_RESUME && is_paused) {
5167021c50bSAsias He 		kvm->vm_state = KVM_VMSTATE_RUNNING;
517d94e22b9SSasha Levin 		kvm__continue();
5187021c50bSAsias He 	} else if (type == KVM_IPC_PAUSE && !is_paused) {
5197021c50bSAsias He 		kvm->vm_state = KVM_VMSTATE_PAUSED;
520d94e22b9SSasha Levin 		kvm__pause();
5217021c50bSAsias He 	} else {
52202317b74SSasha Levin 		return;
5235aa502e4SLai Jiangshan 	}
524d94e22b9SSasha Levin 
525d94e22b9SSasha Levin 	is_paused = !is_paused;
526d94e22b9SSasha Levin }
527d94e22b9SSasha Levin 
5287021c50bSAsias He static void handle_vmstate(int fd, u32 type, u32 len, u8 *msg)
5297021c50bSAsias He {
5307021c50bSAsias He 	int r = 0;
5317021c50bSAsias He 
5327021c50bSAsias He 	if (type == KVM_IPC_VMSTATE)
5337021c50bSAsias He 		r = write(fd, &kvm->vm_state, sizeof(kvm->vm_state));
5347021c50bSAsias He 
5357021c50bSAsias He 	if (r < 0)
5367021c50bSAsias He 		pr_warning("Failed sending VMSTATE");
5377021c50bSAsias He }
5387021c50bSAsias He 
5394b1addaeSSasha Levin static void handle_debug(int fd, u32 type, u32 len, u8 *msg)
5409e854d1aSPekka Enberg {
5419e854d1aSPekka Enberg 	int i;
542a59cdf44SLai Jiangshan 	struct debug_cmd_params *params;
543a59cdf44SLai Jiangshan 	u32 dbg_type;
544a59cdf44SLai Jiangshan 	u32 vcpu;
545a59cdf44SLai Jiangshan 
546a59cdf44SLai Jiangshan 	if (WARN_ON(type != KVM_IPC_DEBUG || len != sizeof(*params)))
547a59cdf44SLai Jiangshan 		return;
548a59cdf44SLai Jiangshan 
549a59cdf44SLai Jiangshan 	params = (void *)msg;
550a59cdf44SLai Jiangshan 	dbg_type = params->dbg_type;
551a59cdf44SLai Jiangshan 	vcpu = params->cpu;
5524b1c6f6eSSasha Levin 
5534b1c6f6eSSasha Levin 	if (dbg_type & KVM_DEBUG_CMD_TYPE_NMI) {
5547070414aSSasha Levin 		if ((int)vcpu >= kvm->nrcpus)
5554b1c6f6eSSasha Levin 			return;
5564b1c6f6eSSasha Levin 
5574b1c6f6eSSasha Levin 		kvm_cpus[vcpu]->needs_nmi = 1;
5584b1c6f6eSSasha Levin 		pthread_kill(kvm_cpus[vcpu]->thread, SIGUSR1);
5594b1c6f6eSSasha Levin 	}
5604b1c6f6eSSasha Levin 
5614b1c6f6eSSasha Levin 	if (!(dbg_type & KVM_DEBUG_CMD_TYPE_DUMP))
5624b1c6f6eSSasha Levin 		return;
5639e854d1aSPekka Enberg 
5649e854d1aSPekka Enberg 	for (i = 0; i < nrcpus; i++) {
5659e854d1aSPekka Enberg 		struct kvm_cpu *cpu = kvm_cpus[i];
5669e854d1aSPekka Enberg 
56743119af7SPekka Enberg 		if (!cpu)
56843119af7SPekka Enberg 			continue;
56943119af7SPekka Enberg 
570cffeab25SIngo Molnar 		printout_done = 0;
571b7d2f013SSasha Levin 
572b7d2f013SSasha Levin 		kvm_cpu__set_debug_fd(fd);
57343119af7SPekka Enberg 		pthread_kill(cpu->thread, SIGUSR1);
574cffeab25SIngo Molnar 		/*
575cffeab25SIngo Molnar 		 * Wait for the vCPU to dump state before signalling
576cffeab25SIngo Molnar 		 * the next thread. Since this is debug code it does
577cffeab25SIngo Molnar 		 * not matter that we are burning CPU time a bit:
578cffeab25SIngo Molnar 		 */
579cffeab25SIngo Molnar 		while (!printout_done)
580cffeab25SIngo Molnar 			mb();
5819e854d1aSPekka Enberg 	}
5829e854d1aSPekka Enberg 
583b7d2f013SSasha Levin 	close(fd);
584b7d2f013SSasha Levin 
5859e854d1aSPekka Enberg 	serial8250__inject_sysrq(kvm);
5869e854d1aSPekka Enberg }
5879e854d1aSPekka Enberg 
5889e854d1aSPekka Enberg static void handle_sigalrm(int sig)
5899e854d1aSPekka Enberg {
5900b69bdefSMatt Evans 	kvm__arch_periodic_poll(kvm);
5919e854d1aSPekka Enberg }
5929e854d1aSPekka Enberg 
5934b1addaeSSasha Levin static void handle_stop(int fd, u32 type, u32 len, u8 *msg)
594daf4cb5aSSasha Levin {
595e333e41aSLai Jiangshan 	if (WARN_ON(type != KVM_IPC_STOP || len))
596e333e41aSLai Jiangshan 		return;
597e333e41aSLai Jiangshan 
598daf4cb5aSSasha Levin 	kvm_cpu__reboot();
599daf4cb5aSSasha Levin }
600daf4cb5aSSasha Levin 
6015ee154d1SPekka Enberg static void *kvm_cpu_thread(void *arg)
6025ee154d1SPekka Enberg {
603d77a9efaSCyrill Gorcunov 	current_kvm_cpu		= arg;
6045ee154d1SPekka Enberg 
605d77a9efaSCyrill Gorcunov 	if (kvm_cpu__start(current_kvm_cpu))
6065ee154d1SPekka Enberg 		goto panic_kvm;
6075ee154d1SPekka Enberg 
6085ee154d1SPekka Enberg 	return (void *) (intptr_t) 0;
6095ee154d1SPekka Enberg 
6105ee154d1SPekka Enberg panic_kvm:
6113fdf659dSSasha Levin 	fprintf(stderr, "KVM exit reason: %u (\"%s\")\n",
612d77a9efaSCyrill Gorcunov 		current_kvm_cpu->kvm_run->exit_reason,
613d77a9efaSCyrill Gorcunov 		kvm_exit_reasons[current_kvm_cpu->kvm_run->exit_reason]);
614d77a9efaSCyrill Gorcunov 	if (current_kvm_cpu->kvm_run->exit_reason == KVM_EXIT_UNKNOWN)
6155ee154d1SPekka Enberg 		fprintf(stderr, "KVM exit code: 0x%Lu\n",
616d77a9efaSCyrill Gorcunov 			current_kvm_cpu->kvm_run->hw.hardware_exit_reason);
6178e5accedSPekka Enberg 
618b7d2f013SSasha Levin 	kvm_cpu__set_debug_fd(STDOUT_FILENO);
619d77a9efaSCyrill Gorcunov 	kvm_cpu__show_registers(current_kvm_cpu);
620d77a9efaSCyrill Gorcunov 	kvm_cpu__show_code(current_kvm_cpu);
621d77a9efaSCyrill Gorcunov 	kvm_cpu__show_page_tables(current_kvm_cpu);
6225ee154d1SPekka Enberg 
6235ee154d1SPekka Enberg 	return (void *) (intptr_t) 1;
6245ee154d1SPekka Enberg }
6255ee154d1SPekka Enberg 
626e08c0896SPrasad Joshi static char kernel[PATH_MAX];
627b0b42ba0SPekka Enberg 
628b0b42ba0SPekka Enberg static const char *host_kernels[] = {
629e08c0896SPrasad Joshi 	"/boot/vmlinuz",
630e08c0896SPrasad Joshi 	"/boot/bzImage",
631e08c0896SPrasad Joshi 	NULL
632e08c0896SPrasad Joshi };
633b0b42ba0SPekka Enberg 
634b0b42ba0SPekka Enberg static const char *default_kernels[] = {
635e08c0896SPrasad Joshi 	"./bzImage",
636b03af790SKonstantin Khlebnikov 	"arch/" BUILD_ARCH "/boot/bzImage",
637af7b0868SMatt Evans 	"../../arch/" BUILD_ARCH "/boot/bzImage",
638e08c0896SPrasad Joshi 	NULL
639e08c0896SPrasad Joshi };
6408329f30bSPekka Enberg 
641b0b42ba0SPekka Enberg static const char *default_vmlinux[] = {
642b03af790SKonstantin Khlebnikov 	"vmlinux",
643b0b42ba0SPekka Enberg 	"../../../vmlinux",
644b0b42ba0SPekka Enberg 	"../../vmlinux",
645b0b42ba0SPekka Enberg 	NULL
646b0b42ba0SPekka Enberg };
647b0b42ba0SPekka Enberg 
648e08c0896SPrasad Joshi static void kernel_usage_with_options(void)
6498329f30bSPekka Enberg {
650e08c0896SPrasad Joshi 	const char **k;
6518329f30bSPekka Enberg 	struct utsname uts;
652e08c0896SPrasad Joshi 
653e08c0896SPrasad Joshi 	fprintf(stderr, "Fatal: could not find default kernel image in:\n");
65465182f37SPrasad Joshi 	k = &default_kernels[0];
655e08c0896SPrasad Joshi 	while (*k) {
656e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", *k);
657e08c0896SPrasad Joshi 		k++;
658e08c0896SPrasad Joshi 	}
659e08c0896SPrasad Joshi 
660e08c0896SPrasad Joshi 	if (uname(&uts) < 0)
661e08c0896SPrasad Joshi 		return;
662e08c0896SPrasad Joshi 
663e08c0896SPrasad Joshi 	k = &host_kernels[0];
664e08c0896SPrasad Joshi 	while (*k) {
665e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
666e08c0896SPrasad Joshi 			return;
667e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", kernel);
668e08c0896SPrasad Joshi 		k++;
669e08c0896SPrasad Joshi 	}
670ee8b1456SWanlong Gao 	fprintf(stderr, "\nPlease see '%s run --help' for more options.\n\n",
671ee8b1456SWanlong Gao 		KVM_BINARY_NAME);
672e08c0896SPrasad Joshi }
673e08c0896SPrasad Joshi 
67460ded003SPekka Enberg static u64 host_ram_size(void)
67560ded003SPekka Enberg {
67660ded003SPekka Enberg 	long page_size;
67760ded003SPekka Enberg 	long nr_pages;
67860ded003SPekka Enberg 
67960ded003SPekka Enberg 	nr_pages	= sysconf(_SC_PHYS_PAGES);
680d63c5ce6SPekka Enberg 	if (nr_pages < 0) {
6814542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PHYS_PAGES) failed");
682d63c5ce6SPekka Enberg 		return 0;
683d63c5ce6SPekka Enberg 	}
68460ded003SPekka Enberg 
68560ded003SPekka Enberg 	page_size	= sysconf(_SC_PAGE_SIZE);
686d63c5ce6SPekka Enberg 	if (page_size < 0) {
6874542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PAGE_SIZE) failed");
688d63c5ce6SPekka Enberg 		return 0;
689d63c5ce6SPekka Enberg 	}
69060ded003SPekka Enberg 
69160ded003SPekka Enberg 	return (nr_pages * page_size) >> MB_SHIFT;
69260ded003SPekka Enberg }
69360ded003SPekka Enberg 
69418bd8c3bSPekka Enberg /*
69518bd8c3bSPekka Enberg  * If user didn't specify how much memory it wants to allocate for the guest,
69618bd8c3bSPekka Enberg  * avoid filling the whole host RAM.
69718bd8c3bSPekka Enberg  */
69818bd8c3bSPekka Enberg #define RAM_SIZE_RATIO		0.8
69918bd8c3bSPekka Enberg 
700fd834defSPekka Enberg static u64 get_ram_size(int nr_cpus)
701fd834defSPekka Enberg {
70206761c76SPekka Enberg 	u64 available;
70306761c76SPekka Enberg 	u64 ram_size;
704fd834defSPekka Enberg 
705fd834defSPekka Enberg 	ram_size	= 64 * (nr_cpus + 3);
706fd834defSPekka Enberg 
70760ded003SPekka Enberg 	available	= host_ram_size() * RAM_SIZE_RATIO;
708d63c5ce6SPekka Enberg 	if (!available)
709d63c5ce6SPekka Enberg 		available = MIN_RAM_SIZE_MB;
710fd834defSPekka Enberg 
711fd834defSPekka Enberg 	if (ram_size > available)
712fd834defSPekka Enberg 		ram_size	= available;
713fd834defSPekka Enberg 
714fd834defSPekka Enberg 	return ram_size;
715fd834defSPekka Enberg }
716fd834defSPekka Enberg 
717e08c0896SPrasad Joshi static const char *find_kernel(void)
718e08c0896SPrasad Joshi {
719e08c0896SPrasad Joshi 	const char **k;
7208329f30bSPekka Enberg 	struct stat st;
721e08c0896SPrasad Joshi 	struct utsname uts;
722e08c0896SPrasad Joshi 
72365182f37SPrasad Joshi 	k = &default_kernels[0];
724e08c0896SPrasad Joshi 	while (*k) {
725e08c0896SPrasad Joshi 		if (stat(*k, &st) < 0 || !S_ISREG(st.st_mode)) {
726e08c0896SPrasad Joshi 			k++;
727e08c0896SPrasad Joshi 			continue;
728e08c0896SPrasad Joshi 		}
729e08c0896SPrasad Joshi 		strncpy(kernel, *k, PATH_MAX);
730e08c0896SPrasad Joshi 		return kernel;
731e08c0896SPrasad Joshi 	}
7328329f30bSPekka Enberg 
7338329f30bSPekka Enberg 	if (uname(&uts) < 0)
7348329f30bSPekka Enberg 		return NULL;
7358329f30bSPekka Enberg 
736e08c0896SPrasad Joshi 	k = &host_kernels[0];
737e08c0896SPrasad Joshi 	while (*k) {
738e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
7398329f30bSPekka Enberg 			return NULL;
7408329f30bSPekka Enberg 
741e08c0896SPrasad Joshi 		if (stat(kernel, &st) < 0 || !S_ISREG(st.st_mode)) {
742e08c0896SPrasad Joshi 			k++;
743e08c0896SPrasad Joshi 			continue;
744e08c0896SPrasad Joshi 		}
745e08c0896SPrasad Joshi 		return kernel;
7468329f30bSPekka Enberg 
747e08c0896SPrasad Joshi 	}
7488329f30bSPekka Enberg 	return NULL;
7498329f30bSPekka Enberg }
7508329f30bSPekka Enberg 
751b0b42ba0SPekka Enberg static const char *find_vmlinux(void)
752b0b42ba0SPekka Enberg {
753b0b42ba0SPekka Enberg 	const char **vmlinux;
754b0b42ba0SPekka Enberg 
755b0b42ba0SPekka Enberg 	vmlinux = &default_vmlinux[0];
756b0b42ba0SPekka Enberg 	while (*vmlinux) {
757b0b42ba0SPekka Enberg 		struct stat st;
758b0b42ba0SPekka Enberg 
759b0b42ba0SPekka Enberg 		if (stat(*vmlinux, &st) < 0 || !S_ISREG(st.st_mode)) {
760b0b42ba0SPekka Enberg 			vmlinux++;
761b0b42ba0SPekka Enberg 			continue;
762b0b42ba0SPekka Enberg 		}
763b0b42ba0SPekka Enberg 		return *vmlinux;
764b0b42ba0SPekka Enberg 	}
765b0b42ba0SPekka Enberg 	return NULL;
766b0b42ba0SPekka Enberg }
767b0b42ba0SPekka Enberg 
768f6677a1dSAmerigo Wang void kvm_run_help(void)
769f6677a1dSAmerigo Wang {
770f6677a1dSAmerigo Wang 	usage_with_options(run_usage, options);
771f6677a1dSAmerigo Wang }
772f6677a1dSAmerigo Wang 
7739cec19c8SSasha Levin static int kvm_custom_stage2(void)
7749cec19c8SSasha Levin {
7759cec19c8SSasha Levin 	char tmp[PATH_MAX], dst[PATH_MAX], *src;
776cb540c93SSasha Levin 	const char *rootfs = custom_rootfs_name;
7779cec19c8SSasha Levin 	int r;
7789cec19c8SSasha Levin 
7799cec19c8SSasha Levin 	src = realpath("guest/init_stage2", NULL);
7809cec19c8SSasha Levin 	if (src == NULL)
7819cec19c8SSasha Levin 		return -ENOMEM;
7829cec19c8SSasha Levin 
7839cec19c8SSasha Levin 	snprintf(tmp, PATH_MAX, "%s%s/virt/init_stage2", kvm__get_dir(), rootfs);
7849cec19c8SSasha Levin 	remove(tmp);
7859cec19c8SSasha Levin 
7869cec19c8SSasha Levin 	snprintf(dst, PATH_MAX, "/host/%s", src);
7879cec19c8SSasha Levin 	r = symlink(dst, tmp);
7889cec19c8SSasha Levin 	free(src);
7899cec19c8SSasha Levin 
7909cec19c8SSasha Levin 	return r;
7919cec19c8SSasha Levin }
7929cec19c8SSasha Levin 
793d50fe489SSasha Levin static int kvm_run_set_sandbox(void)
794d50fe489SSasha Levin {
795cb540c93SSasha Levin 	const char *guestfs_name = custom_rootfs_name;
796d50fe489SSasha Levin 	char path[PATH_MAX], script[PATH_MAX], *tmp;
797d50fe489SSasha Levin 
798d50fe489SSasha Levin 	snprintf(path, PATH_MAX, "%s%s/virt/sandbox.sh", kvm__get_dir(), guestfs_name);
799d50fe489SSasha Levin 
800d50fe489SSasha Levin 	remove(path);
801d50fe489SSasha Levin 
802d50fe489SSasha Levin 	if (sandbox == NULL)
803d50fe489SSasha Levin 		return 0;
804d50fe489SSasha Levin 
805d50fe489SSasha Levin 	tmp = realpath(sandbox, NULL);
806d50fe489SSasha Levin 	if (tmp == NULL)
807d50fe489SSasha Levin 		return -ENOMEM;
808d50fe489SSasha Levin 
809d50fe489SSasha Levin 	snprintf(script, PATH_MAX, "/host/%s", tmp);
810d50fe489SSasha Levin 	free(tmp);
811d50fe489SSasha Levin 
812d50fe489SSasha Levin 	return symlink(script, path);
813d50fe489SSasha Levin }
814d50fe489SSasha Levin 
/*
 * Write @arg to @fd quoted for the shell so it is passed through verbatim.
 *
 * Runs of characters without a single quote are wrapped in '...'; each
 * single quote is emitted as "'". An empty argument is written as ''.
 * Calls die() if any write() returns <= 0.
 */
static void kvm_write_sandbox_cmd_exactly(int fd, const char *arg)
{
	/* an empty argument still has to show up as a word */
	if (*arg == '\0') {
		if (write(fd, "''", 2) <= 0)
			die("Failed writing sandbox script");
		return;
	}

	while (*arg) {
		const char *quote = strchrnul(arg, '\'');
		size_t span = quote - arg;

		/* text up to the next single quote (or end): 'text' */
		if (span) {
			if (write(fd, "'", 1) <= 0 ||
			    write(fd, arg, span) <= 0 ||
			    write(fd, "'", 1) <= 0)
				die("Failed writing sandbox script");
		}

		/* reached the terminating NUL: nothing left to emit */
		if (*quote == '\0')
			break;

		/* the single quote itself: "'" */
		if (write(fd, "\"'\"", 3) <= 0)
			die("Failed writing sandbox script");

		arg = quote + 1;
	}
}
8465173b4afSLai Jiangshan 
8473c29e2aaSSasha Levin static void kvm_run_write_sandbox_cmd(const char **argv, int argc)
8483c29e2aaSSasha Levin {
8493c29e2aaSSasha Levin 	const char script_hdr[] = "#! /bin/bash\n\n";
8503c29e2aaSSasha Levin 	int fd;
8513c29e2aaSSasha Levin 
8523c29e2aaSSasha Levin 	remove(sandbox);
8533c29e2aaSSasha Levin 
8543c29e2aaSSasha Levin 	fd = open(sandbox, O_RDWR | O_CREAT, 0777);
8553c29e2aaSSasha Levin 	if (fd < 0)
8563c29e2aaSSasha Levin 		die("Failed creating sandbox script");
8573c29e2aaSSasha Levin 
8583c29e2aaSSasha Levin 	if (write(fd, script_hdr, sizeof(script_hdr) - 1) <= 0)
8593c29e2aaSSasha Levin 		die("Failed writing sandbox script");
8603c29e2aaSSasha Levin 
8613c29e2aaSSasha Levin 	while (argc) {
8625173b4afSLai Jiangshan 		kvm_write_sandbox_cmd_exactly(fd, argv[0]);
8633c29e2aaSSasha Levin 		if (argc - 1)
8643c29e2aaSSasha Levin 			if (write(fd, " ", 1) <= 0)
8653c29e2aaSSasha Levin 				die("Failed writing sandbox script");
8663c29e2aaSSasha Levin 		argv++;
8673c29e2aaSSasha Levin 		argc--;
8683c29e2aaSSasha Levin 	}
8693c29e2aaSSasha Levin 	if (write(fd, "\n", 1) <= 0)
8703c29e2aaSSasha Levin 		die("Failed writing sandbox script");
8713c29e2aaSSasha Levin 
8723c29e2aaSSasha Levin 	close(fd);
8733c29e2aaSSasha Levin }
8743c29e2aaSSasha Levin 
875e1e46fe6SSasha Levin static int kvm_cmd_run_init(int argc, const char **argv)
876f967c427SPrasad Joshi {
8772d96f6b6SSasha Levin 	static char real_cmdline[2048], default_name[20];
878aba1efa5SPekka Enberg 	struct framebuffer *fb = NULL;
879384922b3SPekka Enberg 	unsigned int nr_online_cpus;
8808259b8ccSSasha Levin 	int max_cpus, recommended_cpus;
8814932d174SSasha Levin 	int i, r;
882f967c427SPrasad Joshi 
8835ee154d1SPekka Enberg 	signal(SIGALRM, handle_sigalrm);
8844b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_DEBUG, handle_debug);
88543119af7SPekka Enberg 	signal(SIGUSR1, handle_sigusr1);
8864b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_PAUSE, handle_pause);
8874b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_RESUME, handle_pause);
8884b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_STOP, handle_stop);
8897021c50bSAsias He 	kvm_ipc__register_handler(KVM_IPC_VMSTATE, handle_vmstate);
890f967c427SPrasad Joshi 
891cfd63bbbSSasha Levin 	nr_online_cpus = sysconf(_SC_NPROCESSORS_ONLN);
892cfd63bbbSSasha Levin 
893f967c427SPrasad Joshi 	while (argc != 0) {
894f967c427SPrasad Joshi 		argc = parse_options(argc, argv, options, run_usage,
8951a007c82SSasha Levin 				PARSE_OPT_STOP_AT_NON_OPTION |
8961a007c82SSasha Levin 				PARSE_OPT_KEEP_DASHDASH);
897f967c427SPrasad Joshi 		if (argc != 0) {
8981a007c82SSasha Levin 			/* Cusrom options, should have been handled elsewhere */
8993c29e2aaSSasha Levin 			if (strcmp(argv[0], "--") == 0) {
9003c29e2aaSSasha Levin 				if (kvm_run_wrapper == KVM_RUN_SANDBOX) {
9013c29e2aaSSasha Levin 					sandbox = DEFAULT_SANDBOX_FILENAME;
9023c29e2aaSSasha Levin 					kvm_run_write_sandbox_cmd(argv+1, argc-1);
9031a007c82SSasha Levin 					break;
9043c29e2aaSSasha Levin 				}
9053c29e2aaSSasha Levin 			}
9061a007c82SSasha Levin 
907e0747665SSasha Levin 			if ((kvm_run_wrapper == KVM_RUN_DEFAULT && kernel_filename) ||
908e0747665SSasha Levin 				(kvm_run_wrapper == KVM_RUN_SANDBOX && sandbox)) {
909f967c427SPrasad Joshi 				fprintf(stderr, "Cannot handle parameter: "
910f967c427SPrasad Joshi 						"%s\n", argv[0]);
911f967c427SPrasad Joshi 				usage_with_options(run_usage, options);
912f967c427SPrasad Joshi 				return EINVAL;
913f967c427SPrasad Joshi 			}
914e0747665SSasha Levin 			if (kvm_run_wrapper == KVM_RUN_SANDBOX) {
915e0747665SSasha Levin 				/*
916e0747665SSasha Levin 				 * first unhandled parameter is treated as
917e0747665SSasha Levin 				 * sandbox command
918e0747665SSasha Levin 				 */
919e0747665SSasha Levin 				sandbox = DEFAULT_SANDBOX_FILENAME;
920e0747665SSasha Levin 				kvm_run_write_sandbox_cmd(argv, argc);
921e0747665SSasha Levin 			} else {
922e0747665SSasha Levin 				/*
923e0747665SSasha Levin 				 * first unhandled parameter is treated as a kernel
924e0747665SSasha Levin 				 * image
925f967c427SPrasad Joshi 				 */
926f967c427SPrasad Joshi 				kernel_filename = argv[0];
927e0747665SSasha Levin 			}
928f967c427SPrasad Joshi 			argv++;
929f967c427SPrasad Joshi 			argc--;
930f967c427SPrasad Joshi 		}
931f967c427SPrasad Joshi 
932f967c427SPrasad Joshi 	}
933f967c427SPrasad Joshi 
93445bc2f02SPekka Enberg 	if (!kernel_filename)
935e08c0896SPrasad Joshi 		kernel_filename = find_kernel();
9368329f30bSPekka Enberg 
9378329f30bSPekka Enberg 	if (!kernel_filename) {
938e08c0896SPrasad Joshi 		kernel_usage_with_options();
9398329f30bSPekka Enberg 		return EINVAL;
9408329f30bSPekka Enberg 	}
9418329f30bSPekka Enberg 
942b0b42ba0SPekka Enberg 	vmlinux_filename = find_vmlinux();
943b0b42ba0SPekka Enberg 
944cfd63bbbSSasha Levin 	if (nrcpus == 0)
945cfd63bbbSSasha Levin 		nrcpus = nr_online_cpus;
946d77a9efaSCyrill Gorcunov 
947fd834defSPekka Enberg 	if (!ram_size)
948fd834defSPekka Enberg 		ram_size	= get_ram_size(nrcpus);
949fd834defSPekka Enberg 
950a2a002f9SIngo Molnar 	if (ram_size < MIN_RAM_SIZE_MB)
951a2a002f9SIngo Molnar 		die("Not enough memory specified: %lluMB (min %lluMB)", ram_size, MIN_RAM_SIZE_MB);
952a2a002f9SIngo Molnar 
95360ded003SPekka Enberg 	if (ram_size > host_ram_size())
9544542f276SCyrill Gorcunov 		pr_warning("Guest memory size %lluMB exceeds host physical RAM size %lluMB", ram_size, host_ram_size());
95560ded003SPekka Enberg 
956f967c427SPrasad Joshi 	ram_size <<= MB_SHIFT;
957f967c427SPrasad Joshi 
9585929637bSAsias He 	if (!dev)
9595929637bSAsias He 		dev = DEFAULT_KVM_DEV;
960f967c427SPrasad Joshi 
9619aa4a0ebSAsias He 	if (!console)
9629aa4a0ebSAsias He 		console = DEFAULT_CONSOLE;
9639aa4a0ebSAsias He 
9649aa4a0ebSAsias He 	if (!strncmp(console, "virtio", 6))
965f967c427SPrasad Joshi 		active_console  = CONSOLE_VIRTIO;
9663bbc49b6SMatt Evans 	else if (!strncmp(console, "serial", 6))
9679aa4a0ebSAsias He 		active_console  = CONSOLE_8250;
9683bbc49b6SMatt Evans 	else if (!strncmp(console, "hv", 2))
9693bbc49b6SMatt Evans 		active_console = CONSOLE_HV;
9703bbc49b6SMatt Evans 	else
9713bbc49b6SMatt Evans 		pr_warning("No console!");
972f967c427SPrasad Joshi 
973e80ddf6aSAsias He 	if (!host_ip)
974e80ddf6aSAsias He 		host_ip = DEFAULT_HOST_ADDR;
9754d67c820SSasha Levin 
976bb8ffd2fSAsias He 	if (!guest_ip)
977bb8ffd2fSAsias He 		guest_ip = DEFAULT_GUEST_ADDR;
978bb8ffd2fSAsias He 
979a4e724ddSSasha Levin 	if (!guest_mac)
980a4e724ddSSasha Levin 		guest_mac = DEFAULT_GUEST_MAC;
981a4e724ddSSasha Levin 
982d7098b9bSAsias He 	if (!host_mac)
983d7098b9bSAsias He 		host_mac = DEFAULT_HOST_MAC;
984d7098b9bSAsias He 
98573b7d038SAmos Kong 	if (!script)
98673b7d038SAmos Kong 		script = DEFAULT_SCRIPT;
98773b7d038SAmos Kong 
988f967c427SPrasad Joshi 	term_init();
989f967c427SPrasad Joshi 
9902d96f6b6SSasha Levin 	if (!guest_name) {
991587a4d17SLai Jiangshan 		if (custom_rootfs) {
992587a4d17SLai Jiangshan 			guest_name = custom_rootfs_name;
993587a4d17SLai Jiangshan 		} else {
9942d96f6b6SSasha Levin 			sprintf(default_name, "guest-%u", getpid());
9952d96f6b6SSasha Levin 			guest_name = default_name;
9962d96f6b6SSasha Levin 		}
997587a4d17SLai Jiangshan 	}
9982d96f6b6SSasha Levin 
99961061257SMatt Evans 	kvm = kvm__init(dev, hugetlbfs_path, ram_size, guest_name);
1000f967c427SPrasad Joshi 
10016d6a4d41SPekka Enberg 	kvm->single_step = single_step;
10026d6a4d41SPekka Enberg 
1003e1337781SSasha Levin 	ioeventfd__init(kvm);
100437f3d50eSSasha Levin 
1005384922b3SPekka Enberg 	max_cpus = kvm__max_cpus(kvm);
10068259b8ccSSasha Levin 	recommended_cpus = kvm__recommended_cpus(kvm);
1007384922b3SPekka Enberg 
1008384922b3SPekka Enberg 	if (nrcpus > max_cpus) {
1009384922b3SPekka Enberg 		printf("  # Limit the number of CPUs to %d\n", max_cpus);
101090c05188SMatt Evans 		nrcpus = max_cpus;
10118259b8ccSSasha Levin 	} else if (nrcpus > recommended_cpus) {
10128259b8ccSSasha Levin 		printf("  # Warning: The maximum recommended amount of VCPUs"
10138259b8ccSSasha Levin 			" is %d\n", recommended_cpus);
1014384922b3SPekka Enberg 	}
1015384922b3SPekka Enberg 
10160c7c14a7SCyrill Gorcunov 	kvm->nrcpus = nrcpus;
10170c7c14a7SCyrill Gorcunov 
1018e2077857SMatt Evans 	/* Alloc one pointer too many, so array ends up 0-terminated */
1019e2077857SMatt Evans 	kvm_cpus = calloc(nrcpus + 1, sizeof(void *));
1020e2077857SMatt Evans 	if (!kvm_cpus)
1021e2077857SMatt Evans 		die("Couldn't allocate array for %d CPUs", nrcpus);
1022e2077857SMatt Evans 
1023e3c4f8aaSSasha Levin 	r = irq__init(kvm);
1024e3c4f8aaSSasha Levin 	if (r < 0) {
1025e3c4f8aaSSasha Levin 		pr_err("irq__init() failed with error %d\n", r);
1026e3c4f8aaSSasha Levin 		goto fail;
1027e3c4f8aaSSasha Levin 	}
102819e6c8b8SMatt Evans 
1029b91be965SMatt Evans 	pci__init();
1030b91be965SMatt Evans 
1031890364f8SCyrill Gorcunov 	/*
1032890364f8SCyrill Gorcunov 	 * vidmode should be either specified
1033890364f8SCyrill Gorcunov 	 * either set by default
1034890364f8SCyrill Gorcunov 	 */
1035890364f8SCyrill Gorcunov 	if (vnc || sdl) {
1036890364f8SCyrill Gorcunov 		if (vidmode == -1)
1037890364f8SCyrill Gorcunov 			vidmode = 0x312;
1038*48d9e01aSSasha Levin 	} else {
1039890364f8SCyrill Gorcunov 		vidmode = 0;
1040*48d9e01aSSasha Levin 	}
1041890364f8SCyrill Gorcunov 
104226c853e4SPrasad Joshi 	memset(real_cmdline, 0, sizeof(real_cmdline));
10438e704a7aSMatt Evans 	kvm__arch_set_cmdline(real_cmdline, vnc || sdl);
10448e704a7aSMatt Evans 
10458e704a7aSMatt Evans 	if (strlen(real_cmdline) > 0)
1046d74181ccSSasha Levin 		strcat(real_cmdline, " ");
10478e704a7aSMatt Evans 
104826c853e4SPrasad Joshi 	if (kernel_cmdline)
104926c853e4SPrasad Joshi 		strlcat(real_cmdline, kernel_cmdline, sizeof(real_cmdline));
105026c853e4SPrasad Joshi 
1051c5174622SMatt Evans 	if (!using_rootfs && !image_filename[0] && !initrd_filename) {
1052c8675741SSasha Levin 		char tmp[PATH_MAX];
10536df1471eSPekka Enberg 
1054cb540c93SSasha Levin 		kvm_setup_create_new(custom_rootfs_name);
1055cb540c93SSasha Levin 		kvm_setup_resolv(custom_rootfs_name);
1056c8675741SSasha Levin 
10579667701cSPekka Enberg 		snprintf(tmp, PATH_MAX, "%s%s", kvm__get_dir(), "default");
1058c8675741SSasha Levin 		if (virtio_9p__register(kvm, tmp, "/dev/root") < 0)
1059c8675741SSasha Levin 			die("Unable to initialize virtio 9p");
1060c8675741SSasha Levin 		if (virtio_9p__register(kvm, "/", "hostfs") < 0)
1061c8675741SSasha Levin 			die("Unable to initialize virtio 9p");
1062c8675741SSasha Levin 		using_rootfs = custom_rootfs = 1;
106326c853e4SPrasad Joshi 	}
106426c853e4SPrasad Joshi 
106582d65b5eSSasha Levin 	if (using_rootfs) {
1066ff42603fSSasha Levin 		strcat(real_cmdline, " root=/dev/root rw rootflags=rw,trans=virtio,version=9p2000.L rootfstype=9p");
1067a8e6b4b9SSasha Levin 		if (custom_rootfs) {
1068d50fe489SSasha Levin 			kvm_run_set_sandbox();
1069d50fe489SSasha Levin 
1070a8e6b4b9SSasha Levin 			strcat(real_cmdline, " init=/virt/init");
1071d50fe489SSasha Levin 
1072a8e6b4b9SSasha Levin 			if (!no_dhcp)
1073a8e6b4b9SSasha Levin 				strcat(real_cmdline, "  ip=dhcp");
10749cec19c8SSasha Levin 			if (kvm_custom_stage2())
10759cec19c8SSasha Levin 				die("Failed linking stage 2 of init.");
1076a8e6b4b9SSasha Levin 		}
107782d65b5eSSasha Levin 	} else if (!strstr(real_cmdline, "root=")) {
1078ff42603fSSasha Levin 		strlcat(real_cmdline, " root=/dev/vda rw ", sizeof(real_cmdline));
107982d65b5eSSasha Levin 	}
108059aa2d30SSasha Levin 
1081c1ed214eSPrasad Joshi 	if (image_count) {
1082bcb6aacaSPrasad Joshi 		kvm->nr_disks = image_count;
1083c1ed214eSPrasad Joshi 		kvm->disks    = disk_image__open_all(image_filename, readonly_image, image_count);
1084c1ed214eSPrasad Joshi 		if (!kvm->disks)
1085c1ed214eSPrasad Joshi 			die("Unable to load all disk images.");
108638605e1cSSasha Levin 
1087bcb6aacaSPrasad Joshi 		virtio_blk__init_all(kvm);
1088f967c427SPrasad Joshi 	}
1089c1ed214eSPrasad Joshi 
1090ee8b1456SWanlong Gao 	printf("  # %s run -k %s -m %Lu -c %d --name %s\n", KVM_BINARY_NAME,
1091ee8b1456SWanlong Gao 		kernel_filename, ram_size / 1024 / 1024, nrcpus, guest_name);
1092471c6facSPekka Enberg 
1093f967c427SPrasad Joshi 	if (!kvm__load_kernel(kvm, kernel_filename, initrd_filename,
10945ffd4178SJohn Floren 				real_cmdline, vidmode))
1095f967c427SPrasad Joshi 		die("unable to load kernel %s", kernel_filename);
1096f967c427SPrasad Joshi 
1097b0b42ba0SPekka Enberg 	kvm->vmlinux = vmlinux_filename;
10984932d174SSasha Levin 	r = symbol__init(kvm);
10994932d174SSasha Levin 	if (r < 0) {
11004932d174SSasha Levin 		pr_err("symbol__init() failed with error %d\n", r);
11014932d174SSasha Levin 		goto fail;
11024932d174SSasha Levin 	}
1103b0b42ba0SPekka Enberg 
1104af7b0868SMatt Evans 	ioport__setup_arch();
1105ac38f433SPekka Enberg 
110664136c1cSPekka Enberg 	rtc__init();
110764136c1cSPekka Enberg 
1108f967c427SPrasad Joshi 	serial8250__init(kvm);
1109f967c427SPrasad Joshi 
11101621292eSSasha Levin 	if (active_console == CONSOLE_VIRTIO)
1111f967c427SPrasad Joshi 		virtio_console__init(kvm);
1112f967c427SPrasad Joshi 
111353eca082SSasha Levin 	if (virtio_rng)
111453eca082SSasha Levin 		virtio_rng__init(kvm);
111553eca082SSasha Levin 
111682d2f21eSSasha Levin 	if (balloon)
111782d2f21eSSasha Levin 		virtio_bln__init(kvm);
111882d2f21eSSasha Levin 
11194f56d42cSAsias He 	if (!network)
11204f56d42cSAsias He 		network = DEFAULT_NETWORK;
11214f56d42cSAsias He 
1122c7838fbdSSasha Levin 	virtio_9p__init(kvm);
1123c7838fbdSSasha Levin 
11249a6d73f1SSasha Levin 	for (i = 0; i < num_net_devices; i++) {
11259a6d73f1SSasha Levin 		net_params[i].kvm = kvm;
11269a6d73f1SSasha Levin 		virtio_net__init(&net_params[i]);
11279a6d73f1SSasha Levin 	}
1128a4e724ddSSasha Levin 
11299a6d73f1SSasha Levin 	if (num_net_devices == 0 && no_net == 0) {
11309a6d73f1SSasha Levin 		struct virtio_net_params net_params;
11319a6d73f1SSasha Levin 
11329a6d73f1SSasha Levin 		net_params = (struct virtio_net_params) {
11339a6d73f1SSasha Levin 			.guest_ip	= guest_ip,
11349a6d73f1SSasha Levin 			.host_ip	= host_ip,
11359a6d73f1SSasha Levin 			.kvm		= kvm,
11369a6d73f1SSasha Levin 			.script		= script,
11379a6d73f1SSasha Levin 			.mode		= NET_MODE_USER,
11389a6d73f1SSasha Levin 		};
11399a6d73f1SSasha Levin 		str_to_mac(guest_mac, net_params.guest_mac);
11409a6d73f1SSasha Levin 		str_to_mac(host_mac, net_params.host_mac);
11419a6d73f1SSasha Levin 
1142bdfcfca6SSasha Levin 		virtio_net__init(&net_params);
1143bdfcfca6SSasha Levin 	}
11444f56d42cSAsias He 
1145839051d9SSasha Levin 	kvm__init_ram(kvm);
1146839051d9SSasha Levin 
114757d7832bSMatt Evans #ifdef CONFIG_X86
1148714e5b7fSSasha Levin 	kbd__init(kvm);
114957d7832bSMatt Evans #endif
1150714e5b7fSSasha Levin 
115195d13a52SSasha Levin 	pci_shmem__init(kvm);
115295d13a52SSasha Levin 
1153*48d9e01aSSasha Levin 	if (vnc || sdl) {
11543f838fecSPekka Enberg 		fb = vesa__init(kvm);
1155*48d9e01aSSasha Levin 		if (IS_ERR(fb)) {
1156*48d9e01aSSasha Levin 			pr_err("vesa__init() failed with error %ld\n", PTR_ERR(fb));
1157*48d9e01aSSasha Levin 			goto fail;
1158*48d9e01aSSasha Levin 		}
11593f838fecSPekka Enberg 	}
11603f838fecSPekka Enberg 
1161*48d9e01aSSasha Levin 	if (vnc && fb) {
1162*48d9e01aSSasha Levin 		r = vnc__init(fb);
1163*48d9e01aSSasha Levin 		if (r < 0) {
1164*48d9e01aSSasha Levin 			pr_err("vnc__init() failed with error %d\n", r);
1165*48d9e01aSSasha Levin 			goto fail;
1166*48d9e01aSSasha Levin 		}
1167*48d9e01aSSasha Levin 	}
1168*48d9e01aSSasha Levin 
1169*48d9e01aSSasha Levin 	if (sdl && fb) {
11703f838fecSPekka Enberg 		sdl__init(fb);
1171*48d9e01aSSasha Levin 		if (r < 0) {
1172*48d9e01aSSasha Levin 			pr_err("sdl__init() failed with error %d\n", r);
1173*48d9e01aSSasha Levin 			goto fail;
1174*48d9e01aSSasha Levin 		}
11753f838fecSPekka Enberg 	}
1176aba1efa5SPekka Enberg 
1177*48d9e01aSSasha Levin 	r = fb__start();
1178*48d9e01aSSasha Levin 	if (r < 0) {
1179*48d9e01aSSasha Levin 		pr_err("fb__init() failed with error %d\n", r);
1180*48d9e01aSSasha Levin 		goto fail;
1181*48d9e01aSSasha Levin 	}
1182aba1efa5SPekka Enberg 
118325af47eeSMatt Evans 	/* Device init all done; firmware init must
118425af47eeSMatt Evans 	 * come after this (it may set up device trees etc.)
118525af47eeSMatt Evans 	 */
118625af47eeSMatt Evans 
118725af47eeSMatt Evans 	kvm__start_timer(kvm);
118825af47eeSMatt Evans 
1189e1e46fe6SSasha Levin 	kvm__arch_setup_firmware(kvm);
119025af47eeSMatt Evans 
119125af47eeSMatt Evans 	for (i = 0; i < nrcpus; i++) {
119225af47eeSMatt Evans 		kvm_cpus[i] = kvm_cpu__init(kvm, i);
119325af47eeSMatt Evans 		if (!kvm_cpus[i])
119425af47eeSMatt Evans 			die("unable to initialize KVM VCPU");
119525af47eeSMatt Evans 	}
119625af47eeSMatt Evans 
1197d60bafe5SSasha Levin 	thread_pool__init(nr_online_cpus);
119837f3d50eSSasha Levin 	ioeventfd__start();
1199d60bafe5SSasha Levin 
12004932d174SSasha Levin fail:
12014932d174SSasha Levin 	return r;
1202e1e46fe6SSasha Levin }
1203e1e46fe6SSasha Levin 
1204e1e46fe6SSasha Levin static int kvm_cmd_run_work(void)
1205e1e46fe6SSasha Levin {
1206e1e46fe6SSasha Levin 	int i, r = -1;
1207e1e46fe6SSasha Levin 	void *ret = NULL;
1208e1e46fe6SSasha Levin 
1209839051d9SSasha Levin 	for (i = 0; i < nrcpus; i++) {
1210d77a9efaSCyrill Gorcunov 		if (pthread_create(&kvm_cpus[i]->thread, NULL, kvm_cpu_thread, kvm_cpus[i]) != 0)
12115ee154d1SPekka Enberg 			die("unable to create KVM VCPU thread");
12125ee154d1SPekka Enberg 	}
12135ee154d1SPekka Enberg 
121449e5227dSSasha Levin 	/* Only VCPU #0 is going to exit by itself when shutting down */
121549e5227dSSasha Levin 	if (pthread_join(kvm_cpus[0]->thread, &ret) != 0)
1216e1e46fe6SSasha Levin 		r = 0;
12175ee154d1SPekka Enberg 
121889e0575aSPekka Enberg 	kvm_cpu__delete(kvm_cpus[0]);
121989e0575aSPekka Enberg 
122049e5227dSSasha Levin 	for (i = 1; i < nrcpus; i++) {
1221c23d9748SSasha Levin 		if (kvm_cpus[i]->is_running) {
122249e5227dSSasha Levin 			pthread_kill(kvm_cpus[i]->thread, SIGKVMEXIT);
1223d77a9efaSCyrill Gorcunov 			if (pthread_join(kvm_cpus[i]->thread, &ret) != 0)
12245ee154d1SPekka Enberg 				die("pthread_join");
122589e0575aSPekka Enberg 			kvm_cpu__delete(kvm_cpus[i]);
1226c23d9748SSasha Levin 		}
1227e1e46fe6SSasha Levin 		if (ret == NULL)
1228e1e46fe6SSasha Levin 			r = 0;
12295ee154d1SPekka Enberg 	}
1230f967c427SPrasad Joshi 
1231e1e46fe6SSasha Levin 	return r;
1232e1e46fe6SSasha Levin }
1233e1e46fe6SSasha Levin 
12344932d174SSasha Levin static void kvm_cmd_run_exit(int guest_ret)
1235e1e46fe6SSasha Levin {
12364932d174SSasha Levin 	int r = 0;
12374932d174SSasha Levin 
1238e6694207SSasha Levin 	compat__print_all_messages();
1239e6694207SSasha Levin 
12404932d174SSasha Levin 	r = symbol__exit(kvm);
12414932d174SSasha Levin 	if (r < 0)
12424932d174SSasha Levin 		pr_warning("symbol__exit() failed with error %d\n", r);
12434932d174SSasha Levin 
1244e3c4f8aaSSasha Levin 	r = irq__exit(kvm);
1245e3c4f8aaSSasha Levin 	if (r < 0)
1246e3c4f8aaSSasha Levin 		pr_warning("irq__exit() failed with error %d\n", r);
1247e3c4f8aaSSasha Levin 
1248aba1efa5SPekka Enberg 	fb__stop();
1249aba1efa5SPekka Enberg 
1250a0a1e3c2SPrasad Joshi 	virtio_blk__delete_all(kvm);
125180ac1d05SSasha Levin 	virtio_rng__delete_all(kvm);
1252a0a1e3c2SPrasad Joshi 
12539df47d00SPrasad Joshi 	disk_image__close_all(kvm->disks, image_count);
1254569b139dSPekka Enberg 	free(kvm_cpus);
1255f967c427SPrasad Joshi 	kvm__delete(kvm);
1256f967c427SPrasad Joshi 
1257e1e46fe6SSasha Levin 	if (guest_ret == 0)
1258f967c427SPrasad Joshi 		printf("\n  # KVM session ended normally.\n");
1259e1e46fe6SSasha Levin }
1260e1e46fe6SSasha Levin 
/*
 * Entry point of the 'run' command: initialise the VM, run it until it
 * stops, then tear everything down.
 *
 * @prefix is not used here.
 *
 * Returns the negative result of kvm_cmd_run_init() if initialisation
 * fails, otherwise the result of kvm_cmd_run_work().
 */
int kvm_cmd_run(int argc, const char **argv, const char *prefix)
{
	int guest_ret;
	int err = kvm_cmd_run_init(argc, argv);

	if (err < 0)
		return err;

	guest_ret = kvm_cmd_run_work();
	kvm_cmd_run_exit(guest_ret);

	return guest_ret;
}
1274