xref: /kvmtool/builtin-run.c (revision afc2c7c0ba836937d65fb5bd5f76864a0371c52f)
1ece09f8fSPekka Enberg #include "kvm/builtin-run.h"
2ece09f8fSPekka Enberg 
3c8675741SSasha Levin #include "kvm/builtin-setup.h"
4ece09f8fSPekka Enberg #include "kvm/virtio-balloon.h"
5ece09f8fSPekka Enberg #include "kvm/virtio-console.h"
6ece09f8fSPekka Enberg #include "kvm/parse-options.h"
7ece09f8fSPekka Enberg #include "kvm/8250-serial.h"
8ece09f8fSPekka Enberg #include "kvm/framebuffer.h"
9ece09f8fSPekka Enberg #include "kvm/disk-image.h"
10ece09f8fSPekka Enberg #include "kvm/threadpool.h"
11a67da3beSAsias He #include "kvm/virtio-scsi.h"
12ece09f8fSPekka Enberg #include "kvm/virtio-blk.h"
13ece09f8fSPekka Enberg #include "kvm/virtio-net.h"
14ece09f8fSPekka Enberg #include "kvm/virtio-rng.h"
15ece09f8fSPekka Enberg #include "kvm/ioeventfd.h"
16ece09f8fSPekka Enberg #include "kvm/virtio-9p.h"
17ece09f8fSPekka Enberg #include "kvm/barrier.h"
18ece09f8fSPekka Enberg #include "kvm/kvm-cpu.h"
19ece09f8fSPekka Enberg #include "kvm/ioport.h"
20ece09f8fSPekka Enberg #include "kvm/symbol.h"
21ece09f8fSPekka Enberg #include "kvm/i8042.h"
22ece09f8fSPekka Enberg #include "kvm/mutex.h"
23ece09f8fSPekka Enberg #include "kvm/term.h"
24ece09f8fSPekka Enberg #include "kvm/util.h"
25ec52d504SLai Jiangshan #include "kvm/strbuf.h"
26ece09f8fSPekka Enberg #include "kvm/vesa.h"
27ece09f8fSPekka Enberg #include "kvm/irq.h"
28ece09f8fSPekka Enberg #include "kvm/kvm.h"
29ece09f8fSPekka Enberg #include "kvm/pci.h"
30ece09f8fSPekka Enberg #include "kvm/rtc.h"
31ece09f8fSPekka Enberg #include "kvm/sdl.h"
32ece09f8fSPekka Enberg #include "kvm/vnc.h"
33e6694207SSasha Levin #include "kvm/guest_compat.h"
3495d13a52SSasha Levin #include "kvm/pci-shmem.h"
354b1addaeSSasha Levin #include "kvm/kvm-ipc.h"
364b1c6f6eSSasha Levin #include "kvm/builtin-debug.h"
37ece09f8fSPekka Enberg 
38ece09f8fSPekka Enberg #include <linux/types.h>
3948d9e01aSSasha Levin #include <linux/err.h>
40ece09f8fSPekka Enberg 
418329f30bSPekka Enberg #include <sys/utsname.h>
428329f30bSPekka Enberg #include <sys/types.h>
438329f30bSPekka Enberg #include <sys/stat.h>
44ece09f8fSPekka Enberg #include <termios.h>
45ece09f8fSPekka Enberg #include <signal.h>
46ece09f8fSPekka Enberg #include <stdlib.h>
47ece09f8fSPekka Enberg #include <string.h>
48ece09f8fSPekka Enberg #include <unistd.h>
4926c853e4SPrasad Joshi #include <ctype.h>
50ece09f8fSPekka Enberg #include <stdio.h>
51f967c427SPrasad Joshi 
/*
 * Built-in default values.  Within this part of the file the guest/host
 * addresses, the guest MAC and the script name seed the parameters of a
 * newly created NIC (see netdev_parser()).
 */
#define DEFAULT_KVM_DEV		"/dev/kvm"
#define DEFAULT_CONSOLE		"serial"
#define DEFAULT_NETWORK		"user"
#define DEFAULT_HOST_ADDR	"192.168.33.1"
#define DEFAULT_GUEST_ADDR	"192.168.33.15"
#define DEFAULT_GUEST_MAC	"02:15:15:15:15:15"
#define DEFAULT_HOST_MAC	"02:01:01:01:01:01"
#define DEFAULT_SCRIPT		"none"

/* Not static: has external linkage. */
const char *DEFAULT_SANDBOX_FILENAME = "guest/sandbox.sh";

/* Shift counts converting a value in KiB/MiB/GiB into bytes. */
#define KB_SHIFT		(10)
#define MB_SHIFT		(20)
#define GB_SHIFT		(30)

/* Minimum guest RAM size, expressed in MiB and in bytes. */
#define MIN_RAM_SIZE_MB		(64ULL)
#define MIN_RAM_SIZE_BYTE	(MIN_RAM_SIZE_MB << MB_SHIFT)
67f967c427SPrasad Joshi 
684298ddadSSasha Levin struct kvm *kvm;
69e2077857SMatt Evans struct kvm_cpu **kvm_cpus;
70656be1b8SSasha Levin __thread struct kvm_cpu *current_kvm_cpu;
71f967c427SPrasad Joshi 
7297f16d66SAsias He static struct disk_image_params disk_image[MAX_DISK_IMAGES];
73fd834defSPekka Enberg static u64 ram_size;
74a33979d8SSasha Levin static u8  image_count;
759a6d73f1SSasha Levin static u8 num_net_devices;
76cf55d6aeSLiming Wang static bool virtio_rng;
77f967c427SPrasad Joshi static const char *kernel_cmdline;
78f967c427SPrasad Joshi static const char *kernel_filename;
79b0b42ba0SPekka Enberg static const char *vmlinux_filename;
80f967c427SPrasad Joshi static const char *initrd_filename;
815ad8db5eSPekka Enberg static const char *firmware_filename;
829aa4a0ebSAsias He static const char *console;
835929637bSAsias He static const char *dev;
844f56d42cSAsias He static const char *network;
85e80ddf6aSAsias He static const char *host_ip;
86bb8ffd2fSAsias He static const char *guest_ip;
87a4e724ddSSasha Levin static const char *guest_mac;
88d7098b9bSAsias He static const char *host_mac;
8973b7d038SAmos Kong static const char *script;
905358b0e6SSasha Levin static const char *guest_name;
91d50fe489SSasha Levin static const char *sandbox;
9261061257SMatt Evans static const char *hugetlbfs_path;
93cb540c93SSasha Levin static const char *custom_rootfs_name = "default";
949a6d73f1SSasha Levin static struct virtio_net_params *net_params;
950ea58e5bSPekka Enberg static bool single_step;
965ffd4178SJohn Floren static bool vnc;
973f838fecSPekka Enberg static bool sdl;
9882d2f21eSSasha Levin static bool balloon;
9959aa2d30SSasha Levin static bool using_rootfs;
10082d65b5eSSasha Levin static bool custom_rootfs;
1019a6d73f1SSasha Levin static bool no_net;
102a8e6b4b9SSasha Levin static bool no_dhcp;
103f967c427SPrasad Joshi extern bool ioport_debug;
104d562e086SCyrill Gorcunov extern bool mmio_debug;
1053c29e2aaSSasha Levin static int  kvm_run_wrapper;
106f967c427SPrasad Joshi extern int  active_console;
107aa400b00SPrasad Joshi extern int  debug_iodelay;
108f967c427SPrasad Joshi 
109ed036f03SCyrill Gorcunov bool do_debug_print = false;
110ed036f03SCyrill Gorcunov 
111cfd63bbbSSasha Levin static int nrcpus;
112890364f8SCyrill Gorcunov static int vidmode = -1;
113d77a9efaSCyrill Gorcunov 
114*afc2c7c0SAsias He extern char _binary_guest_init_stage2_start;
115*afc2c7c0SAsias He extern char _binary_guest_init_stage2_size;
116*afc2c7c0SAsias He extern char _binary_guest_init_start;
117*afc2c7c0SAsias He extern char _binary_guest_init_size;
118*afc2c7c0SAsias He 
/* NULL-terminated list of usage lines for the "run" command. */
static const char * const run_usage[] = {
	"lkvm run [<options>] [<kernel image>]",
	NULL,
};
123f967c427SPrasad Joshi 
1243c29e2aaSSasha Levin enum {
125e0747665SSasha Levin 	KVM_RUN_DEFAULT,
1263c29e2aaSSasha Levin 	KVM_RUN_SANDBOX,
1273c29e2aaSSasha Levin };
1283c29e2aaSSasha Levin 
1293c29e2aaSSasha Levin void kvm_run_set_wrapper_sandbox(void)
1303c29e2aaSSasha Levin {
1313c29e2aaSSasha Levin 	kvm_run_wrapper = KVM_RUN_SANDBOX;
1323c29e2aaSSasha Levin }
1333c29e2aaSSasha Levin 
134a33979d8SSasha Levin static int img_name_parser(const struct option *opt, const char *arg, int unset)
135a33979d8SSasha Levin {
13682d65b5eSSasha Levin 	char path[PATH_MAX];
1375236b505SAsias He 	const char *cur;
1385236b505SAsias He 	struct stat st;
1395236b505SAsias He 	char *sep;
14059aa2d30SSasha Levin 
14159aa2d30SSasha Levin 	if (stat(arg, &st) == 0 &&
14259aa2d30SSasha Levin 	    S_ISDIR(st.st_mode)) {
14359aa2d30SSasha Levin 		char tmp[PATH_MAX];
14459aa2d30SSasha Levin 
1452c908af9SLai Jiangshan 		if (using_rootfs)
1462c908af9SLai Jiangshan 			die("Please use only one rootfs directory atmost");
1472c908af9SLai Jiangshan 
14859aa2d30SSasha Levin 		if (realpath(arg, tmp) == 0 ||
149c7838fbdSSasha Levin 		    virtio_9p__register(kvm, tmp, "/dev/root") < 0)
15059aa2d30SSasha Levin 			die("Unable to initialize virtio 9p");
15159aa2d30SSasha Levin 		using_rootfs = 1;
15259aa2d30SSasha Levin 		return 0;
15359aa2d30SSasha Levin 	}
154a33979d8SSasha Levin 
1559667701cSPekka Enberg 	snprintf(path, PATH_MAX, "%s%s", kvm__get_dir(), arg);
15682d65b5eSSasha Levin 
15782d65b5eSSasha Levin 	if (stat(path, &st) == 0 &&
15882d65b5eSSasha Levin 	    S_ISDIR(st.st_mode)) {
15982d65b5eSSasha Levin 		char tmp[PATH_MAX];
16082d65b5eSSasha Levin 
1612c908af9SLai Jiangshan 		if (using_rootfs)
1622c908af9SLai Jiangshan 			die("Please use only one rootfs directory atmost");
1632c908af9SLai Jiangshan 
16482d65b5eSSasha Levin 		if (realpath(path, tmp) == 0 ||
16582d65b5eSSasha Levin 		    virtio_9p__register(kvm, tmp, "/dev/root") < 0)
16682d65b5eSSasha Levin 			die("Unable to initialize virtio 9p");
16782d65b5eSSasha Levin 		if (virtio_9p__register(kvm, "/", "hostfs") < 0)
16882d65b5eSSasha Levin 			die("Unable to initialize virtio 9p");
16969c88b95SSasha Levin 		kvm_setup_resolv(arg);
17082d65b5eSSasha Levin 		using_rootfs = custom_rootfs = 1;
171cb540c93SSasha Levin 		custom_rootfs_name = arg;
17282d65b5eSSasha Levin 		return 0;
17382d65b5eSSasha Levin 	}
17482d65b5eSSasha Levin 
175a33979d8SSasha Levin 	if (image_count >= MAX_DISK_IMAGES)
176a33979d8SSasha Levin 		die("Currently only 4 images are supported");
177a33979d8SSasha Levin 
17897f16d66SAsias He 	disk_image[image_count].filename = arg;
1795236b505SAsias He 	cur = arg;
180a67da3beSAsias He 
181a67da3beSAsias He 	if (strncmp(arg, "scsi:", 5) == 0) {
182a67da3beSAsias He 		sep = strstr(arg, ":");
183a67da3beSAsias He 		if (sep)
184a67da3beSAsias He 			disk_image[image_count].wwpn = sep + 1;
185a67da3beSAsias He 		sep = strstr(sep + 1, ":");
186a67da3beSAsias He 		if (sep) {
187a67da3beSAsias He 			*sep = 0;
188a67da3beSAsias He 			disk_image[image_count].tpgt = sep + 1;
189a67da3beSAsias He 		}
190a67da3beSAsias He 		cur = sep + 1;
191a67da3beSAsias He 	}
192a67da3beSAsias He 
1935236b505SAsias He 	do {
1945236b505SAsias He 		sep = strstr(cur, ",");
195a33979d8SSasha Levin 		if (sep) {
1965236b505SAsias He 			if (strncmp(sep + 1, "ro", 2) == 0)
19797f16d66SAsias He 				disk_image[image_count].readonly = true;
1985236b505SAsias He 			else if (strncmp(sep + 1, "direct", 6) == 0)
1995236b505SAsias He 				disk_image[image_count].direct = true;
200a33979d8SSasha Levin 			*sep = 0;
2015236b505SAsias He 			cur = sep + 1;
202a33979d8SSasha Levin 		}
2035236b505SAsias He 	} while (sep);
204a33979d8SSasha Levin 
205a33979d8SSasha Levin 	image_count++;
206a33979d8SSasha Levin 
207a33979d8SSasha Levin 	return 0;
208a33979d8SSasha Levin }
209a33979d8SSasha Levin 
210b4422bf3SAneesh Kumar K.V static int virtio_9p_rootdir_parser(const struct option *opt, const char *arg, int unset)
211b4422bf3SAneesh Kumar K.V {
212b4422bf3SAneesh Kumar K.V 	char *tag_name;
213b4422bf3SAneesh Kumar K.V 	char tmp[PATH_MAX];
214b4422bf3SAneesh Kumar K.V 
215b4422bf3SAneesh Kumar K.V 	/*
216b4422bf3SAneesh Kumar K.V 	 * 9p dir can be of the form dirname,tag_name or
217b4422bf3SAneesh Kumar K.V 	 * just dirname. In the later case we use the
218b4422bf3SAneesh Kumar K.V 	 * default tag name
219b4422bf3SAneesh Kumar K.V 	 */
220b4422bf3SAneesh Kumar K.V 	tag_name = strstr(arg, ",");
221b4422bf3SAneesh Kumar K.V 	if (tag_name) {
222b4422bf3SAneesh Kumar K.V 		*tag_name = '\0';
223b4422bf3SAneesh Kumar K.V 		tag_name++;
224b4422bf3SAneesh Kumar K.V 	}
22554f6802dSPekka Enberg 	if (realpath(arg, tmp)) {
226c7838fbdSSasha Levin 		if (virtio_9p__register(kvm, tmp, tag_name) < 0)
22754f6802dSPekka Enberg 			die("Unable to initialize virtio 9p");
22854f6802dSPekka Enberg 	} else
229b4422bf3SAneesh Kumar K.V 		die("Failed resolving 9p path");
230b4422bf3SAneesh Kumar K.V 	return 0;
231b4422bf3SAneesh Kumar K.V }
232b4422bf3SAneesh Kumar K.V 
/*
 * Option callback for --tty: parse the decimal tty id in @arg and pass it to
 * term_set_tty().
 *
 * Input that is not a complete decimal integer, or that does not fit in an
 * int, is rejected with die() instead of being silently read as 0.
 *
 * Returns 0.
 */
static int tty_parser(const struct option *opt, const char *arg, int unset)
{
	char *end;
	long tty;

	tty = strtol(arg, &end, 10);
	if (end == arg || *end != '\0' || tty != (int)tty)
		die("Invalid tty id '%s'", arg);

	term_set_tty((int)tty);

	return 0;
}
2411add4b76SSasha Levin 
/*
 * Parse a MAC address written as six colon-separated hex octets
 * ("aa:bb:cc:dd:ee:ff") from @str into the six bytes at @mac.
 *
 * If @str is malformed, only the octets that were converted before the
 * mismatch are written; the remaining bytes of @mac are left untouched.
 * No error is reported to the caller.
 */
static inline void str_to_mac(const char *str, char *mac)
{
	/* "%hhx" stores through an unsigned char pointer. */
	unsigned char *octet = (unsigned char *)mac;

	sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
	       &octet[0], &octet[1], &octet[2],
	       &octet[3], &octet[4], &octet[5]);
}
2479a6d73f1SSasha Levin static int set_net_param(struct virtio_net_params *p, const char *param,
2489a6d73f1SSasha Levin 				const char *val)
2499a6d73f1SSasha Levin {
2509a6d73f1SSasha Levin 	if (strcmp(param, "guest_mac") == 0) {
2519a6d73f1SSasha Levin 		str_to_mac(val, p->guest_mac);
2529a6d73f1SSasha Levin 	} else if (strcmp(param, "mode") == 0) {
2539a6d73f1SSasha Levin 		if (!strncmp(val, "user", 4)) {
2549a6d73f1SSasha Levin 			int i;
2559a6d73f1SSasha Levin 
2569a6d73f1SSasha Levin 			for (i = 0; i < num_net_devices; i++)
2579a6d73f1SSasha Levin 				if (net_params[i].mode == NET_MODE_USER)
2589a6d73f1SSasha Levin 					die("Only one usermode network device allowed at a time");
2599a6d73f1SSasha Levin 			p->mode = NET_MODE_USER;
2609a6d73f1SSasha Levin 		} else if (!strncmp(val, "tap", 3)) {
2619a6d73f1SSasha Levin 			p->mode = NET_MODE_TAP;
2629a6d73f1SSasha Levin 		} else if (!strncmp(val, "none", 4)) {
2639a6d73f1SSasha Levin 			no_net = 1;
2649a6d73f1SSasha Levin 			return -1;
2659a6d73f1SSasha Levin 		} else
2669a6d73f1SSasha Levin 			die("Unkown network mode %s, please use user, tap or none", network);
2679a6d73f1SSasha Levin 	} else if (strcmp(param, "script") == 0) {
2689a6d73f1SSasha Levin 		p->script = strdup(val);
2699a6d73f1SSasha Levin 	} else if (strcmp(param, "guest_ip") == 0) {
2709a6d73f1SSasha Levin 		p->guest_ip = strdup(val);
2719a6d73f1SSasha Levin 	} else if (strcmp(param, "host_ip") == 0) {
2729a6d73f1SSasha Levin 		p->host_ip = strdup(val);
27369205aa1SAsias He 	} else if (strcmp(param, "trans") == 0) {
27469205aa1SAsias He 		p->trans = strdup(val);
2759ed67cdcSSasha Levin 	} else if (strcmp(param, "vhost") == 0) {
2769ed67cdcSSasha Levin 		p->vhost = atoi(val);
277f19edd1eSSasha Levin 	} else if (strcmp(param, "fd") == 0) {
278f19edd1eSSasha Levin 		p->fd = atoi(val);
27921aa628eSMichael Ellerman 	} else
28021aa628eSMichael Ellerman 		die("Unknown network parameter %s", param);
2819a6d73f1SSasha Levin 
2829a6d73f1SSasha Levin 	return 0;
2839a6d73f1SSasha Levin }
2849a6d73f1SSasha Levin 
2859a6d73f1SSasha Levin static int netdev_parser(const struct option *opt, const char *arg, int unset)
2869a6d73f1SSasha Levin {
2879a6d73f1SSasha Levin 	struct virtio_net_params p;
2889a6d73f1SSasha Levin 	char *buf = NULL, *cmd = NULL, *cur = NULL;
2899a6d73f1SSasha Levin 	bool on_cmd = true;
2909a6d73f1SSasha Levin 
2919a6d73f1SSasha Levin 	if (arg) {
2929a6d73f1SSasha Levin 		buf = strdup(arg);
2939a6d73f1SSasha Levin 		if (buf == NULL)
2949a6d73f1SSasha Levin 			die("Failed allocating new net buffer");
2959a6d73f1SSasha Levin 		cur = strtok(buf, ",=");
2969a6d73f1SSasha Levin 	}
2979a6d73f1SSasha Levin 
2989a6d73f1SSasha Levin 	p = (struct virtio_net_params) {
2999a6d73f1SSasha Levin 		.guest_ip	= DEFAULT_GUEST_ADDR,
3009a6d73f1SSasha Levin 		.host_ip	= DEFAULT_HOST_ADDR,
3019a6d73f1SSasha Levin 		.script		= DEFAULT_SCRIPT,
3029a6d73f1SSasha Levin 		.mode		= NET_MODE_TAP,
3039a6d73f1SSasha Levin 	};
3049a6d73f1SSasha Levin 
3059a6d73f1SSasha Levin 	str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac);
3069a6d73f1SSasha Levin 	p.guest_mac[5] += num_net_devices;
3079a6d73f1SSasha Levin 
3089a6d73f1SSasha Levin 	while (cur) {
3099a6d73f1SSasha Levin 		if (on_cmd) {
3109a6d73f1SSasha Levin 			cmd = cur;
3119a6d73f1SSasha Levin 		} else {
3129a6d73f1SSasha Levin 			if (set_net_param(&p, cmd, cur) < 0)
3139a6d73f1SSasha Levin 				goto done;
3149a6d73f1SSasha Levin 		}
3159a6d73f1SSasha Levin 		on_cmd = !on_cmd;
3169a6d73f1SSasha Levin 
3179a6d73f1SSasha Levin 		cur = strtok(NULL, ",=");
3189a6d73f1SSasha Levin 	};
3199a6d73f1SSasha Levin 
3209a6d73f1SSasha Levin 	num_net_devices++;
3219a6d73f1SSasha Levin 
3229a6d73f1SSasha Levin 	net_params = realloc(net_params, num_net_devices * sizeof(*net_params));
3239a6d73f1SSasha Levin 	if (net_params == NULL)
3249a6d73f1SSasha Levin 		die("Failed adding new network device");
3259a6d73f1SSasha Levin 
3269a6d73f1SSasha Levin 	net_params[num_net_devices - 1] = p;
3279a6d73f1SSasha Levin 
3289a6d73f1SSasha Levin done:
3299a6d73f1SSasha Levin 	free(buf);
3309a6d73f1SSasha Levin 	return 0;
3319a6d73f1SSasha Levin }
3329a6d73f1SSasha Levin 
33395d13a52SSasha Levin static int shmem_parser(const struct option *opt, const char *arg, int unset)
33495d13a52SSasha Levin {
33572f1ad6dSSasha Levin 	const u64 default_size = SHMEM_DEFAULT_SIZE;
33672f1ad6dSSasha Levin 	const u64 default_phys_addr = SHMEM_DEFAULT_ADDR;
33795d13a52SSasha Levin 	const char *default_handle = SHMEM_DEFAULT_HANDLE;
33895d13a52SSasha Levin 	struct shmem_info *si = malloc(sizeof(struct shmem_info));
33972f1ad6dSSasha Levin 	u64 phys_addr;
34072f1ad6dSSasha Levin 	u64 size;
34195d13a52SSasha Levin 	char *handle = NULL;
34295d13a52SSasha Levin 	int create = 0;
34395d13a52SSasha Levin 	const char *p = arg;
34495d13a52SSasha Levin 	char *next;
34595d13a52SSasha Levin 	int base = 10;
34695d13a52SSasha Levin 	int verbose = 0;
34795d13a52SSasha Levin 
34895d13a52SSasha Levin 	const int skip_pci = strlen("pci:");
34995d13a52SSasha Levin 	if (verbose)
35095d13a52SSasha Levin 		pr_info("shmem_parser(%p,%s,%d)", opt, arg, unset);
35195d13a52SSasha Levin 	/* parse out optional addr family */
35295d13a52SSasha Levin 	if (strcasestr(p, "pci:")) {
35395d13a52SSasha Levin 		p += skip_pci;
35495d13a52SSasha Levin 	} else if (strcasestr(p, "mem:")) {
35595d13a52SSasha Levin 		die("I can't add to E820 map yet.\n");
35695d13a52SSasha Levin 	}
35795d13a52SSasha Levin 	/* parse out physical addr */
35895d13a52SSasha Levin 	base = 10;
35995d13a52SSasha Levin 	if (strcasestr(p, "0x"))
36095d13a52SSasha Levin 		base = 16;
36195d13a52SSasha Levin 	phys_addr = strtoll(p, &next, base);
36295d13a52SSasha Levin 	if (next == p && phys_addr == 0) {
36395d13a52SSasha Levin 		pr_info("shmem: no physical addr specified, using default.");
36495d13a52SSasha Levin 		phys_addr = default_phys_addr;
36595d13a52SSasha Levin 	}
36695d13a52SSasha Levin 	if (*next != ':' && *next != '\0')
36795d13a52SSasha Levin 		die("shmem: unexpected chars after phys addr.\n");
36895d13a52SSasha Levin 	if (*next == '\0')
36995d13a52SSasha Levin 		p = next;
37095d13a52SSasha Levin 	else
37195d13a52SSasha Levin 		p = next + 1;
37295d13a52SSasha Levin 	/* parse out size */
37395d13a52SSasha Levin 	base = 10;
37495d13a52SSasha Levin 	if (strcasestr(p, "0x"))
37595d13a52SSasha Levin 		base = 16;
37695d13a52SSasha Levin 	size = strtoll(p, &next, base);
37795d13a52SSasha Levin 	if (next == p && size == 0) {
37895d13a52SSasha Levin 		pr_info("shmem: no size specified, using default.");
37995d13a52SSasha Levin 		size = default_size;
38095d13a52SSasha Levin 	}
38195d13a52SSasha Levin 	/* look for [KMGkmg][Bb]*  uses base 2. */
38295d13a52SSasha Levin 	int skip_B = 0;
38395d13a52SSasha Levin 	if (strspn(next, "KMGkmg")) {	/* might have a prefix */
38495d13a52SSasha Levin 		if (*(next + 1) == 'B' || *(next + 1) == 'b')
38595d13a52SSasha Levin 			skip_B = 1;
38695d13a52SSasha Levin 		switch (*next) {
38795d13a52SSasha Levin 		case 'K':
38895d13a52SSasha Levin 		case 'k':
38995d13a52SSasha Levin 			size = size << KB_SHIFT;
39095d13a52SSasha Levin 			break;
39195d13a52SSasha Levin 		case 'M':
39295d13a52SSasha Levin 		case 'm':
39395d13a52SSasha Levin 			size = size << MB_SHIFT;
39495d13a52SSasha Levin 			break;
39595d13a52SSasha Levin 		case 'G':
39695d13a52SSasha Levin 		case 'g':
39795d13a52SSasha Levin 			size = size << GB_SHIFT;
39895d13a52SSasha Levin 			break;
39995d13a52SSasha Levin 		default:
40095d13a52SSasha Levin 			die("shmem: bug in detecting size prefix.");
40195d13a52SSasha Levin 			break;
40295d13a52SSasha Levin 		}
40395d13a52SSasha Levin 		next += 1 + skip_B;
40495d13a52SSasha Levin 	}
40595d13a52SSasha Levin 	if (*next != ':' && *next != '\0') {
40695d13a52SSasha Levin 		die("shmem: unexpected chars after phys size. <%c><%c>\n",
40795d13a52SSasha Levin 		    *next, *p);
40895d13a52SSasha Levin 	}
40995d13a52SSasha Levin 	if (*next == '\0')
41095d13a52SSasha Levin 		p = next;
41195d13a52SSasha Levin 	else
41295d13a52SSasha Levin 		p = next + 1;
41395d13a52SSasha Levin 	/* parse out optional shmem handle */
41495d13a52SSasha Levin 	const int skip_handle = strlen("handle=");
41595d13a52SSasha Levin 	next = strcasestr(p, "handle=");
41695d13a52SSasha Levin 	if (*p && next) {
41795d13a52SSasha Levin 		if (p != next)
41895d13a52SSasha Levin 			die("unexpected chars before handle\n");
41995d13a52SSasha Levin 		p += skip_handle;
42095d13a52SSasha Levin 		next = strchrnul(p, ':');
42195d13a52SSasha Levin 		if (next - p) {
42295d13a52SSasha Levin 			handle = malloc(next - p + 1);
42395d13a52SSasha Levin 			strncpy(handle, p, next - p);
42495d13a52SSasha Levin 			handle[next - p] = '\0';	/* just in case. */
42595d13a52SSasha Levin 		}
42695d13a52SSasha Levin 		if (*next == '\0')
42795d13a52SSasha Levin 			p = next;
42895d13a52SSasha Levin 		else
42995d13a52SSasha Levin 			p = next + 1;
43095d13a52SSasha Levin 	}
43195d13a52SSasha Levin 	/* parse optional create flag to see if we should create shm seg. */
43295d13a52SSasha Levin 	if (*p && strcasestr(p, "create")) {
43395d13a52SSasha Levin 		create = 1;
43495d13a52SSasha Levin 		p += strlen("create");
43595d13a52SSasha Levin 	}
43695d13a52SSasha Levin 	if (*p != '\0')
43795d13a52SSasha Levin 		die("shmem: unexpected trailing chars\n");
43895d13a52SSasha Levin 	if (handle == NULL) {
43995d13a52SSasha Levin 		handle = malloc(strlen(default_handle) + 1);
44095d13a52SSasha Levin 		strcpy(handle, default_handle);
44195d13a52SSasha Levin 	}
44295d13a52SSasha Levin 	if (verbose) {
44372f1ad6dSSasha Levin 		pr_info("shmem: phys_addr = %llx", phys_addr);
44472f1ad6dSSasha Levin 		pr_info("shmem: size      = %llx", size);
44595d13a52SSasha Levin 		pr_info("shmem: handle    = %s", handle);
44695d13a52SSasha Levin 		pr_info("shmem: create    = %d", create);
44795d13a52SSasha Levin 	}
44895d13a52SSasha Levin 
44995d13a52SSasha Levin 	si->phys_addr = phys_addr;
45095d13a52SSasha Levin 	si->size = size;
45195d13a52SSasha Levin 	si->handle = handle;
45295d13a52SSasha Levin 	si->create = create;
45395d13a52SSasha Levin 	pci_shmem__register_mem(si);	/* ownership of si, etc. passed on. */
45495d13a52SSasha Levin 	return 0;
45595d13a52SSasha Levin }
456b4422bf3SAneesh Kumar K.V 
457f967c427SPrasad Joshi static const struct option options[] = {
4585e3af62dSSasha Levin 	OPT_GROUP("Basic options:"),
4595358b0e6SSasha Levin 	OPT_STRING('\0', "name", &guest_name, "guest name",
4605358b0e6SSasha Levin 			"A name for the guest"),
46180b1f72fSPekka Enberg 	OPT_INTEGER('c', "cpus", &nrcpus, "Number of CPUs"),
462f967c427SPrasad Joshi 	OPT_U64('m', "mem", &ram_size, "Virtual machine memory size in MiB."),
46395d13a52SSasha Levin 	OPT_CALLBACK('\0', "shmem", NULL,
46495d13a52SSasha Levin 		     "[pci:]<addr>:<size>[:handle=<handle>][:create]",
46595d13a52SSasha Levin 		     "Share host shmem with guest via pci device",
46695d13a52SSasha Levin 		     shmem_parser),
467cadb9ab7SAsias He 	OPT_CALLBACK('d', "disk", NULL, "image or rootfs_dir", "Disk image or rootfs directory", img_name_parser),
46882d2f21eSSasha Levin 	OPT_BOOLEAN('\0', "balloon", &balloon, "Enable virtio balloon"),
4695ffd4178SJohn Floren 	OPT_BOOLEAN('\0', "vnc", &vnc, "Enable VNC framebuffer"),
4703f838fecSPekka Enberg 	OPT_BOOLEAN('\0', "sdl", &sdl, "Enable SDL framebuffer"),
471cf55d6aeSLiming Wang 	OPT_BOOLEAN('\0', "rng", &virtio_rng, "Enable virtio Random Number Generator"),
4728b7565e8SAsias He 	OPT_CALLBACK('\0', "9p", NULL, "dir_to_share,tag_name",
4738b7565e8SAsias He 		     "Enable virtio 9p to share files between host and guest", virtio_9p_rootdir_parser),
4743bbc49b6SMatt Evans 	OPT_STRING('\0', "console", &console, "serial, virtio or hv",
4758b7565e8SAsias He 			"Console to use"),
4768b7565e8SAsias He 	OPT_STRING('\0', "dev", &dev, "device_file", "KVM device file"),
4771add4b76SSasha Levin 	OPT_CALLBACK('\0', "tty", NULL, "tty id",
4781add4b76SSasha Levin 		     "Remap guest TTY into a pty on the host",
4791add4b76SSasha Levin 		     tty_parser),
480d50fe489SSasha Levin 	OPT_STRING('\0', "sandbox", &sandbox, "script",
481d50fe489SSasha Levin 			"Run this script when booting into custom rootfs"),
48261061257SMatt Evans 	OPT_STRING('\0', "hugetlbfs", &hugetlbfs_path, "path", "Hugetlbfs path"),
4835e3af62dSSasha Levin 
4845e3af62dSSasha Levin 	OPT_GROUP("Kernel options:"),
4855e3af62dSSasha Levin 	OPT_STRING('k', "kernel", &kernel_filename, "kernel",
4865e3af62dSSasha Levin 			"Kernel to boot in virtual machine"),
487d6c19027SAsias He 	OPT_STRING('i', "initrd", &initrd_filename, "initrd",
4885e3af62dSSasha Levin 			"Initial RAM disk image"),
4895e3af62dSSasha Levin 	OPT_STRING('p', "params", &kernel_cmdline, "params",
4905e3af62dSSasha Levin 			"Kernel command line arguments"),
4915ad8db5eSPekka Enberg 	OPT_STRING('f', "firmware", &firmware_filename, "firmware",
4925ad8db5eSPekka Enberg 			"Firmware image to boot in virtual machine"),
4935e3af62dSSasha Levin 
4944d67c820SSasha Levin 	OPT_GROUP("Networking options:"),
4959a6d73f1SSasha Levin 	OPT_CALLBACK_DEFAULT('n', "network", NULL, "network params",
4969a6d73f1SSasha Levin 		     "Create a new guest NIC",
4979a6d73f1SSasha Levin 		     netdev_parser, NULL),
498a8e6b4b9SSasha Levin 	OPT_BOOLEAN('\0', "no-dhcp", &no_dhcp, "Disable kernel DHCP in rootfs mode"),
499d6c19027SAsias He 
500890364f8SCyrill Gorcunov 	OPT_GROUP("BIOS options:"),
501890364f8SCyrill Gorcunov 	OPT_INTEGER('\0', "vidmode", &vidmode,
502890364f8SCyrill Gorcunov 		    "Video mode"),
503890364f8SCyrill Gorcunov 
5045e3af62dSSasha Levin 	OPT_GROUP("Debug options:"),
505ed036f03SCyrill Gorcunov 	OPT_BOOLEAN('\0', "debug", &do_debug_print,
506ed036f03SCyrill Gorcunov 			"Enable debug messages"),
507d6c19027SAsias He 	OPT_BOOLEAN('\0', "debug-single-step", &single_step,
508d6c19027SAsias He 			"Enable single stepping"),
509001690a4SSasha Levin 	OPT_BOOLEAN('\0', "debug-ioport", &ioport_debug,
510d6c19027SAsias He 			"Enable ioport debugging"),
511d562e086SCyrill Gorcunov 	OPT_BOOLEAN('\0', "debug-mmio", &mmio_debug,
512d562e086SCyrill Gorcunov 			"Enable MMIO debugging"),
513001690a4SSasha Levin 	OPT_INTEGER('\0', "debug-iodelay", &debug_iodelay,
514aa400b00SPrasad Joshi 			"Delay IO by millisecond"),
515f967c427SPrasad Joshi 	OPT_END()
516f967c427SPrasad Joshi };
517f967c427SPrasad Joshi 
518b5b501ccSIngo Molnar /*
519b5b501ccSIngo Molnar  * Serialize debug printout so that the output of multiple vcpus does not
520b5b501ccSIngo Molnar  * get mixed up:
521b5b501ccSIngo Molnar  */
522cffeab25SIngo Molnar static int printout_done;
523b5b501ccSIngo Molnar 
52443119af7SPekka Enberg static void handle_sigusr1(int sig)
52543119af7SPekka Enberg {
52643119af7SPekka Enberg 	struct kvm_cpu *cpu = current_kvm_cpu;
527b7d2f013SSasha Levin 	int fd = kvm_cpu__get_debug_fd();
52843119af7SPekka Enberg 
5294b1c6f6eSSasha Levin 	if (!cpu || cpu->needs_nmi)
53043119af7SPekka Enberg 		return;
53143119af7SPekka Enberg 
532b7d2f013SSasha Levin 	dprintf(fd, "\n #\n # vCPU #%ld's dump:\n #\n", cpu->cpu_id);
53343119af7SPekka Enberg 	kvm_cpu__show_registers(cpu);
53443119af7SPekka Enberg 	kvm_cpu__show_code(cpu);
53543119af7SPekka Enberg 	kvm_cpu__show_page_tables(cpu);
536b5b501ccSIngo Molnar 	fflush(stdout);
537cffeab25SIngo Molnar 	printout_done = 1;
538cffeab25SIngo Molnar 	mb();
53943119af7SPekka Enberg }
54043119af7SPekka Enberg 
541d94e22b9SSasha Levin /* Pause/resume the guest using SIGUSR2 */
542d94e22b9SSasha Levin static int is_paused;
543d94e22b9SSasha Levin 
5444b1addaeSSasha Levin static void handle_pause(int fd, u32 type, u32 len, u8 *msg)
545d94e22b9SSasha Levin {
5465aa502e4SLai Jiangshan 	if (WARN_ON(len))
5475aa502e4SLai Jiangshan 		return;
5485aa502e4SLai Jiangshan 
5497021c50bSAsias He 	if (type == KVM_IPC_RESUME && is_paused) {
5507021c50bSAsias He 		kvm->vm_state = KVM_VMSTATE_RUNNING;
551d94e22b9SSasha Levin 		kvm__continue();
5527021c50bSAsias He 	} else if (type == KVM_IPC_PAUSE && !is_paused) {
5537021c50bSAsias He 		kvm->vm_state = KVM_VMSTATE_PAUSED;
554eb8dad9dSSasha Levin 		ioctl(kvm->vm_fd, KVM_KVMCLOCK_CTRL);
555d94e22b9SSasha Levin 		kvm__pause();
5567021c50bSAsias He 	} else {
55702317b74SSasha Levin 		return;
5585aa502e4SLai Jiangshan 	}
559d94e22b9SSasha Levin 
560d94e22b9SSasha Levin 	is_paused = !is_paused;
561d94e22b9SSasha Levin }
562d94e22b9SSasha Levin 
5637021c50bSAsias He static void handle_vmstate(int fd, u32 type, u32 len, u8 *msg)
5647021c50bSAsias He {
5657021c50bSAsias He 	int r = 0;
5667021c50bSAsias He 
5677021c50bSAsias He 	if (type == KVM_IPC_VMSTATE)
5687021c50bSAsias He 		r = write(fd, &kvm->vm_state, sizeof(kvm->vm_state));
5697021c50bSAsias He 
5707021c50bSAsias He 	if (r < 0)
5717021c50bSAsias He 		pr_warning("Failed sending VMSTATE");
5727021c50bSAsias He }
5737021c50bSAsias He 
5744b1addaeSSasha Levin static void handle_debug(int fd, u32 type, u32 len, u8 *msg)
5759e854d1aSPekka Enberg {
5769e854d1aSPekka Enberg 	int i;
577a59cdf44SLai Jiangshan 	struct debug_cmd_params *params;
578a59cdf44SLai Jiangshan 	u32 dbg_type;
579a59cdf44SLai Jiangshan 	u32 vcpu;
580a59cdf44SLai Jiangshan 
581a59cdf44SLai Jiangshan 	if (WARN_ON(type != KVM_IPC_DEBUG || len != sizeof(*params)))
582a59cdf44SLai Jiangshan 		return;
583a59cdf44SLai Jiangshan 
584a59cdf44SLai Jiangshan 	params = (void *)msg;
585a59cdf44SLai Jiangshan 	dbg_type = params->dbg_type;
586a59cdf44SLai Jiangshan 	vcpu = params->cpu;
5874b1c6f6eSSasha Levin 
588226e727bSSasha Levin 	if (dbg_type & KVM_DEBUG_CMD_TYPE_SYSRQ)
589226e727bSSasha Levin 		serial8250__inject_sysrq(kvm, params->sysrq);
590226e727bSSasha Levin 
5914b1c6f6eSSasha Levin 	if (dbg_type & KVM_DEBUG_CMD_TYPE_NMI) {
5927070414aSSasha Levin 		if ((int)vcpu >= kvm->nrcpus)
5934b1c6f6eSSasha Levin 			return;
5944b1c6f6eSSasha Levin 
5954b1c6f6eSSasha Levin 		kvm_cpus[vcpu]->needs_nmi = 1;
5964b1c6f6eSSasha Levin 		pthread_kill(kvm_cpus[vcpu]->thread, SIGUSR1);
5974b1c6f6eSSasha Levin 	}
5984b1c6f6eSSasha Levin 
5994b1c6f6eSSasha Levin 	if (!(dbg_type & KVM_DEBUG_CMD_TYPE_DUMP))
6004b1c6f6eSSasha Levin 		return;
6019e854d1aSPekka Enberg 
6029e854d1aSPekka Enberg 	for (i = 0; i < nrcpus; i++) {
6039e854d1aSPekka Enberg 		struct kvm_cpu *cpu = kvm_cpus[i];
6049e854d1aSPekka Enberg 
60543119af7SPekka Enberg 		if (!cpu)
60643119af7SPekka Enberg 			continue;
60743119af7SPekka Enberg 
608cffeab25SIngo Molnar 		printout_done = 0;
609b7d2f013SSasha Levin 
610b7d2f013SSasha Levin 		kvm_cpu__set_debug_fd(fd);
61143119af7SPekka Enberg 		pthread_kill(cpu->thread, SIGUSR1);
612cffeab25SIngo Molnar 		/*
613cffeab25SIngo Molnar 		 * Wait for the vCPU to dump state before signalling
614cffeab25SIngo Molnar 		 * the next thread. Since this is debug code it does
615cffeab25SIngo Molnar 		 * not matter that we are burning CPU time a bit:
616cffeab25SIngo Molnar 		 */
617cffeab25SIngo Molnar 		while (!printout_done)
618cffeab25SIngo Molnar 			mb();
6199e854d1aSPekka Enberg 	}
6209e854d1aSPekka Enberg 
621b7d2f013SSasha Levin 	close(fd);
622b7d2f013SSasha Levin 
623226e727bSSasha Levin 	serial8250__inject_sysrq(kvm, 'p');
6249e854d1aSPekka Enberg }
6259e854d1aSPekka Enberg 
6269e854d1aSPekka Enberg static void handle_sigalrm(int sig)
6279e854d1aSPekka Enberg {
6280b69bdefSMatt Evans 	kvm__arch_periodic_poll(kvm);
6299e854d1aSPekka Enberg }
6309e854d1aSPekka Enberg 
6314b1addaeSSasha Levin static void handle_stop(int fd, u32 type, u32 len, u8 *msg)
632daf4cb5aSSasha Levin {
633e333e41aSLai Jiangshan 	if (WARN_ON(type != KVM_IPC_STOP || len))
634e333e41aSLai Jiangshan 		return;
635e333e41aSLai Jiangshan 
636daf4cb5aSSasha Levin 	kvm_cpu__reboot();
637daf4cb5aSSasha Levin }
638daf4cb5aSSasha Levin 
6395ee154d1SPekka Enberg static void *kvm_cpu_thread(void *arg)
6405ee154d1SPekka Enberg {
641d77a9efaSCyrill Gorcunov 	current_kvm_cpu		= arg;
6425ee154d1SPekka Enberg 
643d77a9efaSCyrill Gorcunov 	if (kvm_cpu__start(current_kvm_cpu))
6445ee154d1SPekka Enberg 		goto panic_kvm;
6455ee154d1SPekka Enberg 
6465ee154d1SPekka Enberg 	return (void *) (intptr_t) 0;
6475ee154d1SPekka Enberg 
6485ee154d1SPekka Enberg panic_kvm:
6493fdf659dSSasha Levin 	fprintf(stderr, "KVM exit reason: %u (\"%s\")\n",
650d77a9efaSCyrill Gorcunov 		current_kvm_cpu->kvm_run->exit_reason,
651d77a9efaSCyrill Gorcunov 		kvm_exit_reasons[current_kvm_cpu->kvm_run->exit_reason]);
652d77a9efaSCyrill Gorcunov 	if (current_kvm_cpu->kvm_run->exit_reason == KVM_EXIT_UNKNOWN)
6535ee154d1SPekka Enberg 		fprintf(stderr, "KVM exit code: 0x%Lu\n",
654d77a9efaSCyrill Gorcunov 			current_kvm_cpu->kvm_run->hw.hardware_exit_reason);
6558e5accedSPekka Enberg 
656b7d2f013SSasha Levin 	kvm_cpu__set_debug_fd(STDOUT_FILENO);
657d77a9efaSCyrill Gorcunov 	kvm_cpu__show_registers(current_kvm_cpu);
658d77a9efaSCyrill Gorcunov 	kvm_cpu__show_code(current_kvm_cpu);
659d77a9efaSCyrill Gorcunov 	kvm_cpu__show_page_tables(current_kvm_cpu);
6605ee154d1SPekka Enberg 
6615ee154d1SPekka Enberg 	return (void *) (intptr_t) 1;
6625ee154d1SPekka Enberg }
6635ee154d1SPekka Enberg 
/*
 * Buffer that receives the kernel image path assembled by find_kernel()
 * (and used as scratch space by kernel_usage_with_options()).
 */
static char kernel[PATH_MAX];

/*
 * Host kernel image path prefixes. The lookup code appends
 * "-<uname release>" to each entry before testing it.
 */
static const char *host_kernels[] = {
	"/boot/vmlinuz",
	"/boot/bzImage",
	NULL
};

/*
 * Kernel image locations tried first, in this order, by find_kernel().
 * The list is NULL-terminated.
 */
static const char *default_kernels[] = {
	"./bzImage",
	"arch/" BUILD_ARCH "/boot/bzImage",
	"../../arch/" BUILD_ARCH "/boot/bzImage",
	NULL
};

/*
 * vmlinux locations tried, in this order, by find_vmlinux().
 * The list is NULL-terminated.
 */
static const char *default_vmlinux[] = {
	"vmlinux",
	"../../../vmlinux",
	"../../vmlinux",
	NULL
};
685b0b42ba0SPekka Enberg 
686e08c0896SPrasad Joshi static void kernel_usage_with_options(void)
6878329f30bSPekka Enberg {
688e08c0896SPrasad Joshi 	const char **k;
6898329f30bSPekka Enberg 	struct utsname uts;
690e08c0896SPrasad Joshi 
691e08c0896SPrasad Joshi 	fprintf(stderr, "Fatal: could not find default kernel image in:\n");
69265182f37SPrasad Joshi 	k = &default_kernels[0];
693e08c0896SPrasad Joshi 	while (*k) {
694e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", *k);
695e08c0896SPrasad Joshi 		k++;
696e08c0896SPrasad Joshi 	}
697e08c0896SPrasad Joshi 
698e08c0896SPrasad Joshi 	if (uname(&uts) < 0)
699e08c0896SPrasad Joshi 		return;
700e08c0896SPrasad Joshi 
701e08c0896SPrasad Joshi 	k = &host_kernels[0];
702e08c0896SPrasad Joshi 	while (*k) {
703e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
704e08c0896SPrasad Joshi 			return;
705e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", kernel);
706e08c0896SPrasad Joshi 		k++;
707e08c0896SPrasad Joshi 	}
708ee8b1456SWanlong Gao 	fprintf(stderr, "\nPlease see '%s run --help' for more options.\n\n",
709ee8b1456SWanlong Gao 		KVM_BINARY_NAME);
710e08c0896SPrasad Joshi }
711e08c0896SPrasad Joshi 
71260ded003SPekka Enberg static u64 host_ram_size(void)
71360ded003SPekka Enberg {
71460ded003SPekka Enberg 	long page_size;
71560ded003SPekka Enberg 	long nr_pages;
71660ded003SPekka Enberg 
71760ded003SPekka Enberg 	nr_pages	= sysconf(_SC_PHYS_PAGES);
718d63c5ce6SPekka Enberg 	if (nr_pages < 0) {
7194542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PHYS_PAGES) failed");
720d63c5ce6SPekka Enberg 		return 0;
721d63c5ce6SPekka Enberg 	}
72260ded003SPekka Enberg 
72360ded003SPekka Enberg 	page_size	= sysconf(_SC_PAGE_SIZE);
724d63c5ce6SPekka Enberg 	if (page_size < 0) {
7254542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PAGE_SIZE) failed");
726d63c5ce6SPekka Enberg 		return 0;
727d63c5ce6SPekka Enberg 	}
72860ded003SPekka Enberg 
72960ded003SPekka Enberg 	return (nr_pages * page_size) >> MB_SHIFT;
73060ded003SPekka Enberg }
73160ded003SPekka Enberg 
/*
 * If the user didn't specify how much memory to allocate for the guest,
 * avoid filling the whole host RAM.
 */
73618bd8c3bSPekka Enberg #define RAM_SIZE_RATIO		0.8
73718bd8c3bSPekka Enberg 
738fd834defSPekka Enberg static u64 get_ram_size(int nr_cpus)
739fd834defSPekka Enberg {
74006761c76SPekka Enberg 	u64 available;
74106761c76SPekka Enberg 	u64 ram_size;
742fd834defSPekka Enberg 
743fd834defSPekka Enberg 	ram_size	= 64 * (nr_cpus + 3);
744fd834defSPekka Enberg 
74560ded003SPekka Enberg 	available	= host_ram_size() * RAM_SIZE_RATIO;
746d63c5ce6SPekka Enberg 	if (!available)
747d63c5ce6SPekka Enberg 		available = MIN_RAM_SIZE_MB;
748fd834defSPekka Enberg 
749fd834defSPekka Enberg 	if (ram_size > available)
750fd834defSPekka Enberg 		ram_size	= available;
751fd834defSPekka Enberg 
752fd834defSPekka Enberg 	return ram_size;
753fd834defSPekka Enberg }
754fd834defSPekka Enberg 
755e08c0896SPrasad Joshi static const char *find_kernel(void)
756e08c0896SPrasad Joshi {
757e08c0896SPrasad Joshi 	const char **k;
7588329f30bSPekka Enberg 	struct stat st;
759e08c0896SPrasad Joshi 	struct utsname uts;
760e08c0896SPrasad Joshi 
76165182f37SPrasad Joshi 	k = &default_kernels[0];
762e08c0896SPrasad Joshi 	while (*k) {
763e08c0896SPrasad Joshi 		if (stat(*k, &st) < 0 || !S_ISREG(st.st_mode)) {
764e08c0896SPrasad Joshi 			k++;
765e08c0896SPrasad Joshi 			continue;
766e08c0896SPrasad Joshi 		}
767e08c0896SPrasad Joshi 		strncpy(kernel, *k, PATH_MAX);
768e08c0896SPrasad Joshi 		return kernel;
769e08c0896SPrasad Joshi 	}
7708329f30bSPekka Enberg 
7718329f30bSPekka Enberg 	if (uname(&uts) < 0)
7728329f30bSPekka Enberg 		return NULL;
7738329f30bSPekka Enberg 
774e08c0896SPrasad Joshi 	k = &host_kernels[0];
775e08c0896SPrasad Joshi 	while (*k) {
776e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
7778329f30bSPekka Enberg 			return NULL;
7788329f30bSPekka Enberg 
779e08c0896SPrasad Joshi 		if (stat(kernel, &st) < 0 || !S_ISREG(st.st_mode)) {
780e08c0896SPrasad Joshi 			k++;
781e08c0896SPrasad Joshi 			continue;
782e08c0896SPrasad Joshi 		}
783e08c0896SPrasad Joshi 		return kernel;
7848329f30bSPekka Enberg 
785e08c0896SPrasad Joshi 	}
7868329f30bSPekka Enberg 	return NULL;
7878329f30bSPekka Enberg }
7888329f30bSPekka Enberg 
789b0b42ba0SPekka Enberg static const char *find_vmlinux(void)
790b0b42ba0SPekka Enberg {
791b0b42ba0SPekka Enberg 	const char **vmlinux;
792b0b42ba0SPekka Enberg 
793b0b42ba0SPekka Enberg 	vmlinux = &default_vmlinux[0];
794b0b42ba0SPekka Enberg 	while (*vmlinux) {
795b0b42ba0SPekka Enberg 		struct stat st;
796b0b42ba0SPekka Enberg 
797b0b42ba0SPekka Enberg 		if (stat(*vmlinux, &st) < 0 || !S_ISREG(st.st_mode)) {
798b0b42ba0SPekka Enberg 			vmlinux++;
799b0b42ba0SPekka Enberg 			continue;
800b0b42ba0SPekka Enberg 		}
801b0b42ba0SPekka Enberg 		return *vmlinux;
802b0b42ba0SPekka Enberg 	}
803b0b42ba0SPekka Enberg 	return NULL;
804b0b42ba0SPekka Enberg }
805b0b42ba0SPekka Enberg 
/*
 * Show help for the 'run' command by handing its usage strings and option
 * table to usage_with_options().
 */
void kvm_run_help(void)
{
	usage_with_options(run_usage, options);
}
810f6677a1dSAmerigo Wang 
811*afc2c7c0SAsias He static int kvm_setup_guest_init(void)
8129cec19c8SSasha Levin {
813cb540c93SSasha Levin 	const char *rootfs = custom_rootfs_name;
814*afc2c7c0SAsias He 	char tmp[PATH_MAX];
815*afc2c7c0SAsias He 	size_t size;
816*afc2c7c0SAsias He 	int fd, ret;
817*afc2c7c0SAsias He 	char *data;
8189cec19c8SSasha Levin 
819*afc2c7c0SAsias He 	/* Setup /virt/init */
820*afc2c7c0SAsias He 	size = (size_t)&_binary_guest_init_size;
821*afc2c7c0SAsias He 	data = (char *)&_binary_guest_init_start;
822*afc2c7c0SAsias He 	snprintf(tmp, PATH_MAX, "%s%s/virt/init", kvm__get_dir(), rootfs);
823*afc2c7c0SAsias He 	remove(tmp);
824*afc2c7c0SAsias He 	fd = open(tmp, O_CREAT | O_WRONLY, 0755);
825*afc2c7c0SAsias He 	if (fd < 0)
826*afc2c7c0SAsias He 		die("Fail to setup %s", tmp);
827*afc2c7c0SAsias He 	ret = xwrite(fd, data, size);
828*afc2c7c0SAsias He 	if (ret < 0)
829*afc2c7c0SAsias He 		die("Fail to setup %s", tmp);
830*afc2c7c0SAsias He 	close(fd);
8319cec19c8SSasha Levin 
832*afc2c7c0SAsias He 	/* Setup /virt/init_stage2 */
833*afc2c7c0SAsias He 	size = (size_t)&_binary_guest_init_stage2_size;
834*afc2c7c0SAsias He 	data = (char *)&_binary_guest_init_stage2_start;
8359cec19c8SSasha Levin 	snprintf(tmp, PATH_MAX, "%s%s/virt/init_stage2", kvm__get_dir(), rootfs);
8369cec19c8SSasha Levin 	remove(tmp);
837*afc2c7c0SAsias He 	fd = open(tmp, O_CREAT | O_WRONLY, 0755);
838*afc2c7c0SAsias He 	if (fd < 0)
839*afc2c7c0SAsias He 		die("Fail to setup %s", tmp);
840*afc2c7c0SAsias He 	ret = xwrite(fd, data, size);
841*afc2c7c0SAsias He 	if (ret < 0)
842*afc2c7c0SAsias He 		die("Fail to setup %s", tmp);
843*afc2c7c0SAsias He 	close(fd);
8449cec19c8SSasha Levin 
845*afc2c7c0SAsias He 	return 0;
8469cec19c8SSasha Levin }
8479cec19c8SSasha Levin 
848d50fe489SSasha Levin static int kvm_run_set_sandbox(void)
849d50fe489SSasha Levin {
850cb540c93SSasha Levin 	const char *guestfs_name = custom_rootfs_name;
851d50fe489SSasha Levin 	char path[PATH_MAX], script[PATH_MAX], *tmp;
852d50fe489SSasha Levin 
853d50fe489SSasha Levin 	snprintf(path, PATH_MAX, "%s%s/virt/sandbox.sh", kvm__get_dir(), guestfs_name);
854d50fe489SSasha Levin 
855d50fe489SSasha Levin 	remove(path);
856d50fe489SSasha Levin 
857d50fe489SSasha Levin 	if (sandbox == NULL)
858d50fe489SSasha Levin 		return 0;
859d50fe489SSasha Levin 
860d50fe489SSasha Levin 	tmp = realpath(sandbox, NULL);
861d50fe489SSasha Levin 	if (tmp == NULL)
862d50fe489SSasha Levin 		return -ENOMEM;
863d50fe489SSasha Levin 
864d50fe489SSasha Levin 	snprintf(script, PATH_MAX, "/host/%s", tmp);
865d50fe489SSasha Levin 	free(tmp);
866d50fe489SSasha Levin 
867d50fe489SSasha Levin 	return symlink(script, path);
868d50fe489SSasha Levin }
869d50fe489SSasha Levin 
/* Write @len bytes of @buf to @fd; a failed or empty write is fatal. */
static void kvm_sandbox_write_or_die(int fd, const char *buf, size_t len)
{
	if (write(fd, buf, len) <= 0)
		die("Failed writing sandbox script");
}

/*
 * Append @arg to the sandbox script on @fd, quoted so that the shell sees
 * it literally.
 *
 * An empty argument becomes ''. Otherwise every run of characters without
 * a single quote is emitted as 'run', and every single quote as "'".
 */
static void kvm_write_sandbox_cmd_exactly(int fd, const char *arg)
{
	size_t run;

	if (*arg == '\0') { /* zero length string */
		kvm_sandbox_write_or_die(fd, "''", 2);
		return;
	}

	while (*arg != '\0') {
		/* length of the leading part that contains no single quote */
		run = strcspn(arg, "'");

		if (run != 0) {
			kvm_sandbox_write_or_die(fd, "'", 1);
			kvm_sandbox_write_or_die(fd, arg, run);
			kvm_sandbox_write_or_die(fd, "'", 1);
		}

		/* reached the terminator: nothing left to quote */
		if (arg[run] == '\0')
			break;

		/* the single quote itself goes out as "'" */
		kvm_sandbox_write_or_die(fd, "\"'\"", 3);

		arg += run + 1;
	}
}
9015173b4afSLai Jiangshan 
9025cd19aa0SPekka Enberg static void resolve_program(const char *src, char *dst, size_t len)
9035cd19aa0SPekka Enberg {
9045cd19aa0SPekka Enberg 	struct stat st;
905c2c742d9SPekka Enberg 	int err;
9065cd19aa0SPekka Enberg 
907c2c742d9SPekka Enberg 	err = stat(src, &st);
9085cd19aa0SPekka Enberg 
909c2c742d9SPekka Enberg 	if (!err && S_ISREG(st.st_mode)) {
9105cd19aa0SPekka Enberg 		char resolved_path[PATH_MAX];
9115cd19aa0SPekka Enberg 
912de3f75c9SPekka Enberg 		if (!realpath(src, resolved_path))
913de3f75c9SPekka Enberg 			die("Unable to resolve program %s: %s\n", src, strerror(errno));
9145cd19aa0SPekka Enberg 
9155cd19aa0SPekka Enberg 		snprintf(dst, len, "/host%s", resolved_path);
9165cd19aa0SPekka Enberg 	} else
9175cd19aa0SPekka Enberg 		strncpy(dst, src, len);
9185cd19aa0SPekka Enberg }
9195cd19aa0SPekka Enberg 
9203c29e2aaSSasha Levin static void kvm_run_write_sandbox_cmd(const char **argv, int argc)
9213c29e2aaSSasha Levin {
9223c29e2aaSSasha Levin 	const char script_hdr[] = "#! /bin/bash\n\n";
9235cd19aa0SPekka Enberg 	char program[PATH_MAX];
9243c29e2aaSSasha Levin 	int fd;
9253c29e2aaSSasha Levin 
9263c29e2aaSSasha Levin 	remove(sandbox);
9273c29e2aaSSasha Levin 
9283c29e2aaSSasha Levin 	fd = open(sandbox, O_RDWR | O_CREAT, 0777);
9293c29e2aaSSasha Levin 	if (fd < 0)
9303c29e2aaSSasha Levin 		die("Failed creating sandbox script");
9313c29e2aaSSasha Levin 
9323c29e2aaSSasha Levin 	if (write(fd, script_hdr, sizeof(script_hdr) - 1) <= 0)
9333c29e2aaSSasha Levin 		die("Failed writing sandbox script");
9343c29e2aaSSasha Levin 
9355cd19aa0SPekka Enberg 	resolve_program(argv[0], program, PATH_MAX);
9365cd19aa0SPekka Enberg 	kvm_write_sandbox_cmd_exactly(fd, program);
9375cd19aa0SPekka Enberg 
9385cd19aa0SPekka Enberg 	argv++;
9395cd19aa0SPekka Enberg 	argc--;
9405cd19aa0SPekka Enberg 
9413c29e2aaSSasha Levin 	while (argc) {
9423c29e2aaSSasha Levin 		if (write(fd, " ", 1) <= 0)
9433c29e2aaSSasha Levin 			die("Failed writing sandbox script");
9445cd19aa0SPekka Enberg 
9455cd19aa0SPekka Enberg 		kvm_write_sandbox_cmd_exactly(fd, argv[0]);
9463c29e2aaSSasha Levin 		argv++;
9473c29e2aaSSasha Levin 		argc--;
9483c29e2aaSSasha Levin 	}
9493c29e2aaSSasha Levin 	if (write(fd, "\n", 1) <= 0)
9503c29e2aaSSasha Levin 		die("Failed writing sandbox script");
9513c29e2aaSSasha Levin 
9523c29e2aaSSasha Levin 	close(fd);
9533c29e2aaSSasha Levin }
9543c29e2aaSSasha Levin 
955e1e46fe6SSasha Levin static int kvm_cmd_run_init(int argc, const char **argv)
956f967c427SPrasad Joshi {
9572d96f6b6SSasha Levin 	static char real_cmdline[2048], default_name[20];
958aba1efa5SPekka Enberg 	struct framebuffer *fb = NULL;
959384922b3SPekka Enberg 	unsigned int nr_online_cpus;
9608259b8ccSSasha Levin 	int max_cpus, recommended_cpus;
9614932d174SSasha Levin 	int i, r;
962f967c427SPrasad Joshi 
9635ee154d1SPekka Enberg 	signal(SIGALRM, handle_sigalrm);
9644b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_DEBUG, handle_debug);
96543119af7SPekka Enberg 	signal(SIGUSR1, handle_sigusr1);
9664b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_PAUSE, handle_pause);
9674b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_RESUME, handle_pause);
9684b1addaeSSasha Levin 	kvm_ipc__register_handler(KVM_IPC_STOP, handle_stop);
9697021c50bSAsias He 	kvm_ipc__register_handler(KVM_IPC_VMSTATE, handle_vmstate);
970f967c427SPrasad Joshi 
971cfd63bbbSSasha Levin 	nr_online_cpus = sysconf(_SC_NPROCESSORS_ONLN);
972cfd63bbbSSasha Levin 
973f967c427SPrasad Joshi 	while (argc != 0) {
974f967c427SPrasad Joshi 		argc = parse_options(argc, argv, options, run_usage,
9751a007c82SSasha Levin 				PARSE_OPT_STOP_AT_NON_OPTION |
9761a007c82SSasha Levin 				PARSE_OPT_KEEP_DASHDASH);
977f967c427SPrasad Joshi 		if (argc != 0) {
9781a007c82SSasha Levin 			/* Cusrom options, should have been handled elsewhere */
9793c29e2aaSSasha Levin 			if (strcmp(argv[0], "--") == 0) {
9803c29e2aaSSasha Levin 				if (kvm_run_wrapper == KVM_RUN_SANDBOX) {
9813c29e2aaSSasha Levin 					sandbox = DEFAULT_SANDBOX_FILENAME;
9823c29e2aaSSasha Levin 					kvm_run_write_sandbox_cmd(argv+1, argc-1);
9831a007c82SSasha Levin 					break;
9843c29e2aaSSasha Levin 				}
9853c29e2aaSSasha Levin 			}
9861a007c82SSasha Levin 
987e0747665SSasha Levin 			if ((kvm_run_wrapper == KVM_RUN_DEFAULT && kernel_filename) ||
988e0747665SSasha Levin 				(kvm_run_wrapper == KVM_RUN_SANDBOX && sandbox)) {
989f967c427SPrasad Joshi 				fprintf(stderr, "Cannot handle parameter: "
990f967c427SPrasad Joshi 						"%s\n", argv[0]);
991f967c427SPrasad Joshi 				usage_with_options(run_usage, options);
992e120b624SPaul Neumann 				return -EINVAL;
993f967c427SPrasad Joshi 			}
994e0747665SSasha Levin 			if (kvm_run_wrapper == KVM_RUN_SANDBOX) {
995e0747665SSasha Levin 				/*
996e0747665SSasha Levin 				 * first unhandled parameter is treated as
997e0747665SSasha Levin 				 * sandbox command
998e0747665SSasha Levin 				 */
999e0747665SSasha Levin 				sandbox = DEFAULT_SANDBOX_FILENAME;
1000e0747665SSasha Levin 				kvm_run_write_sandbox_cmd(argv, argc);
1001e0747665SSasha Levin 			} else {
1002e0747665SSasha Levin 				/*
1003e0747665SSasha Levin 				 * first unhandled parameter is treated as a kernel
1004e0747665SSasha Levin 				 * image
1005f967c427SPrasad Joshi 				 */
1006f967c427SPrasad Joshi 				kernel_filename = argv[0];
1007e0747665SSasha Levin 			}
1008f967c427SPrasad Joshi 			argv++;
1009f967c427SPrasad Joshi 			argc--;
1010f967c427SPrasad Joshi 		}
1011f967c427SPrasad Joshi 
1012f967c427SPrasad Joshi 	}
1013f967c427SPrasad Joshi 
101445bc2f02SPekka Enberg 	if (!kernel_filename)
1015e08c0896SPrasad Joshi 		kernel_filename = find_kernel();
10168329f30bSPekka Enberg 
10178329f30bSPekka Enberg 	if (!kernel_filename) {
1018e08c0896SPrasad Joshi 		kernel_usage_with_options();
1019e120b624SPaul Neumann 		return -EINVAL;
10208329f30bSPekka Enberg 	}
10218329f30bSPekka Enberg 
1022b0b42ba0SPekka Enberg 	vmlinux_filename = find_vmlinux();
1023b0b42ba0SPekka Enberg 
1024cfd63bbbSSasha Levin 	if (nrcpus == 0)
1025cfd63bbbSSasha Levin 		nrcpus = nr_online_cpus;
1026d77a9efaSCyrill Gorcunov 
1027fd834defSPekka Enberg 	if (!ram_size)
1028fd834defSPekka Enberg 		ram_size	= get_ram_size(nrcpus);
1029fd834defSPekka Enberg 
1030a2a002f9SIngo Molnar 	if (ram_size < MIN_RAM_SIZE_MB)
1031a2a002f9SIngo Molnar 		die("Not enough memory specified: %lluMB (min %lluMB)", ram_size, MIN_RAM_SIZE_MB);
1032a2a002f9SIngo Molnar 
103360ded003SPekka Enberg 	if (ram_size > host_ram_size())
10344542f276SCyrill Gorcunov 		pr_warning("Guest memory size %lluMB exceeds host physical RAM size %lluMB", ram_size, host_ram_size());
103560ded003SPekka Enberg 
1036f967c427SPrasad Joshi 	ram_size <<= MB_SHIFT;
1037f967c427SPrasad Joshi 
10385929637bSAsias He 	if (!dev)
10395929637bSAsias He 		dev = DEFAULT_KVM_DEV;
1040f967c427SPrasad Joshi 
10419aa4a0ebSAsias He 	if (!console)
10429aa4a0ebSAsias He 		console = DEFAULT_CONSOLE;
10439aa4a0ebSAsias He 
10449aa4a0ebSAsias He 	if (!strncmp(console, "virtio", 6))
1045f967c427SPrasad Joshi 		active_console  = CONSOLE_VIRTIO;
10463bbc49b6SMatt Evans 	else if (!strncmp(console, "serial", 6))
10479aa4a0ebSAsias He 		active_console  = CONSOLE_8250;
10483bbc49b6SMatt Evans 	else if (!strncmp(console, "hv", 2))
10493bbc49b6SMatt Evans 		active_console = CONSOLE_HV;
10503bbc49b6SMatt Evans 	else
10513bbc49b6SMatt Evans 		pr_warning("No console!");
1052f967c427SPrasad Joshi 
1053e80ddf6aSAsias He 	if (!host_ip)
1054e80ddf6aSAsias He 		host_ip = DEFAULT_HOST_ADDR;
10554d67c820SSasha Levin 
1056bb8ffd2fSAsias He 	if (!guest_ip)
1057bb8ffd2fSAsias He 		guest_ip = DEFAULT_GUEST_ADDR;
1058bb8ffd2fSAsias He 
1059a4e724ddSSasha Levin 	if (!guest_mac)
1060a4e724ddSSasha Levin 		guest_mac = DEFAULT_GUEST_MAC;
1061a4e724ddSSasha Levin 
1062d7098b9bSAsias He 	if (!host_mac)
1063d7098b9bSAsias He 		host_mac = DEFAULT_HOST_MAC;
1064d7098b9bSAsias He 
106573b7d038SAmos Kong 	if (!script)
106673b7d038SAmos Kong 		script = DEFAULT_SCRIPT;
106773b7d038SAmos Kong 
1068f967c427SPrasad Joshi 	term_init();
1069f967c427SPrasad Joshi 
10702d96f6b6SSasha Levin 	if (!guest_name) {
1071587a4d17SLai Jiangshan 		if (custom_rootfs) {
1072587a4d17SLai Jiangshan 			guest_name = custom_rootfs_name;
1073587a4d17SLai Jiangshan 		} else {
10742d96f6b6SSasha Levin 			sprintf(default_name, "guest-%u", getpid());
10752d96f6b6SSasha Levin 			guest_name = default_name;
10762d96f6b6SSasha Levin 		}
1077587a4d17SLai Jiangshan 	}
10782d96f6b6SSasha Levin 
107961061257SMatt Evans 	kvm = kvm__init(dev, hugetlbfs_path, ram_size, guest_name);
1080d648dbf5SCyrill Gorcunov 	if (IS_ERR(kvm)) {
1081d648dbf5SCyrill Gorcunov 		r = PTR_ERR(kvm);
1082d648dbf5SCyrill Gorcunov 		goto fail;
1083d648dbf5SCyrill Gorcunov 	}
1084f967c427SPrasad Joshi 
10856d6a4d41SPekka Enberg 	kvm->single_step = single_step;
10866d6a4d41SPekka Enberg 
1087ea6eeb1cSSasha Levin 	r = ioeventfd__init(kvm);
1088ea6eeb1cSSasha Levin 	if (r < 0) {
1089ea6eeb1cSSasha Levin 		pr_err("ioeventfd__init() failed with error %d\n", r);
1090ea6eeb1cSSasha Levin 		goto fail;
1091ea6eeb1cSSasha Levin 	}
109237f3d50eSSasha Levin 
1093384922b3SPekka Enberg 	max_cpus = kvm__max_cpus(kvm);
10948259b8ccSSasha Levin 	recommended_cpus = kvm__recommended_cpus(kvm);
1095384922b3SPekka Enberg 
1096384922b3SPekka Enberg 	if (nrcpus > max_cpus) {
1097384922b3SPekka Enberg 		printf("  # Limit the number of CPUs to %d\n", max_cpus);
109890c05188SMatt Evans 		nrcpus = max_cpus;
10998259b8ccSSasha Levin 	} else if (nrcpus > recommended_cpus) {
11008259b8ccSSasha Levin 		printf("  # Warning: The maximum recommended amount of VCPUs"
11018259b8ccSSasha Levin 			" is %d\n", recommended_cpus);
1102384922b3SPekka Enberg 	}
1103384922b3SPekka Enberg 
11040c7c14a7SCyrill Gorcunov 	kvm->nrcpus = nrcpus;
11050c7c14a7SCyrill Gorcunov 
1106e2077857SMatt Evans 	/* Alloc one pointer too many, so array ends up 0-terminated */
1107e2077857SMatt Evans 	kvm_cpus = calloc(nrcpus + 1, sizeof(void *));
1108e2077857SMatt Evans 	if (!kvm_cpus)
1109e2077857SMatt Evans 		die("Couldn't allocate array for %d CPUs", nrcpus);
1110e2077857SMatt Evans 
1111e3c4f8aaSSasha Levin 	r = irq__init(kvm);
1112e3c4f8aaSSasha Levin 	if (r < 0) {
1113e3c4f8aaSSasha Levin 		pr_err("irq__init() failed with error %d\n", r);
1114e3c4f8aaSSasha Levin 		goto fail;
1115e3c4f8aaSSasha Levin 	}
111619e6c8b8SMatt Evans 
11176d987703SSasha Levin 	r = pci__init(kvm);
11186d987703SSasha Levin 	if (r < 0) {
11196d987703SSasha Levin 		pr_err("pci__init() failed with error %d\n", r);
11206d987703SSasha Levin 		goto fail;
11216d987703SSasha Levin 	}
1122b91be965SMatt Evans 
11237af40b91SSasha Levin 	r = ioport__init(kvm);
11247af40b91SSasha Levin 	if (r < 0) {
11257af40b91SSasha Levin 		pr_err("ioport__init() failed with error %d\n", r);
11267af40b91SSasha Levin 		goto fail;
11277af40b91SSasha Levin 	}
11287af40b91SSasha Levin 
1129890364f8SCyrill Gorcunov 	/*
1130890364f8SCyrill Gorcunov 	 * vidmode should be either specified
1131890364f8SCyrill Gorcunov 	 * either set by default
1132890364f8SCyrill Gorcunov 	 */
1133890364f8SCyrill Gorcunov 	if (vnc || sdl) {
1134890364f8SCyrill Gorcunov 		if (vidmode == -1)
1135890364f8SCyrill Gorcunov 			vidmode = 0x312;
113648d9e01aSSasha Levin 	} else {
1137890364f8SCyrill Gorcunov 		vidmode = 0;
113848d9e01aSSasha Levin 	}
1139890364f8SCyrill Gorcunov 
114026c853e4SPrasad Joshi 	memset(real_cmdline, 0, sizeof(real_cmdline));
11418e704a7aSMatt Evans 	kvm__arch_set_cmdline(real_cmdline, vnc || sdl);
11428e704a7aSMatt Evans 
11438e704a7aSMatt Evans 	if (strlen(real_cmdline) > 0)
1144d74181ccSSasha Levin 		strcat(real_cmdline, " ");
11458e704a7aSMatt Evans 
114626c853e4SPrasad Joshi 	if (kernel_cmdline)
114726c853e4SPrasad Joshi 		strlcat(real_cmdline, kernel_cmdline, sizeof(real_cmdline));
114826c853e4SPrasad Joshi 
114997f16d66SAsias He 	if (!using_rootfs && !disk_image[0].filename && !initrd_filename) {
1150c8675741SSasha Levin 		char tmp[PATH_MAX];
11516df1471eSPekka Enberg 
1152cb540c93SSasha Levin 		kvm_setup_create_new(custom_rootfs_name);
1153cb540c93SSasha Levin 		kvm_setup_resolv(custom_rootfs_name);
1154c8675741SSasha Levin 
11559667701cSPekka Enberg 		snprintf(tmp, PATH_MAX, "%s%s", kvm__get_dir(), "default");
1156c8675741SSasha Levin 		if (virtio_9p__register(kvm, tmp, "/dev/root") < 0)
1157c8675741SSasha Levin 			die("Unable to initialize virtio 9p");
1158c8675741SSasha Levin 		if (virtio_9p__register(kvm, "/", "hostfs") < 0)
1159c8675741SSasha Levin 			die("Unable to initialize virtio 9p");
1160c8675741SSasha Levin 		using_rootfs = custom_rootfs = 1;
116126c853e4SPrasad Joshi 	}
116226c853e4SPrasad Joshi 
116382d65b5eSSasha Levin 	if (using_rootfs) {
1164ff42603fSSasha Levin 		strcat(real_cmdline, " root=/dev/root rw rootflags=rw,trans=virtio,version=9p2000.L rootfstype=9p");
1165a8e6b4b9SSasha Levin 		if (custom_rootfs) {
1166d50fe489SSasha Levin 			kvm_run_set_sandbox();
1167d50fe489SSasha Levin 
1168a8e6b4b9SSasha Levin 			strcat(real_cmdline, " init=/virt/init");
1169d50fe489SSasha Levin 
1170a8e6b4b9SSasha Levin 			if (!no_dhcp)
1171a8e6b4b9SSasha Levin 				strcat(real_cmdline, "  ip=dhcp");
1172*afc2c7c0SAsias He 			if (kvm_setup_guest_init())
1173*afc2c7c0SAsias He 				die("Failed to setup init for guest.");
1174a8e6b4b9SSasha Levin 		}
117582d65b5eSSasha Levin 	} else if (!strstr(real_cmdline, "root=")) {
1176ff42603fSSasha Levin 		strlcat(real_cmdline, " root=/dev/vda rw ", sizeof(real_cmdline));
117782d65b5eSSasha Levin 	}
117859aa2d30SSasha Levin 
1179c1ed214eSPrasad Joshi 	if (image_count) {
1180bcb6aacaSPrasad Joshi 		kvm->nr_disks = image_count;
118197f16d66SAsias He 		kvm->disks = disk_image__open_all((struct disk_image_params *)&disk_image, image_count);
11829f9207c5SSasha Levin 		if (IS_ERR(kvm->disks)) {
11839f9207c5SSasha Levin 			r = PTR_ERR(kvm->disks);
11849f9207c5SSasha Levin 			pr_err("disk_image__open_all() failed with error %ld\n",
11859f9207c5SSasha Levin 					PTR_ERR(kvm->disks));
11869f9207c5SSasha Levin 			goto fail;
11879f9207c5SSasha Levin 		}
1188f967c427SPrasad Joshi 	}
1189c1ed214eSPrasad Joshi 
1190ee8b1456SWanlong Gao 	printf("  # %s run -k %s -m %Lu -c %d --name %s\n", KVM_BINARY_NAME,
1191ee8b1456SWanlong Gao 		kernel_filename, ram_size / 1024 / 1024, nrcpus, guest_name);
1192471c6facSPekka Enberg 
11935ad8db5eSPekka Enberg 	if (!firmware_filename) {
11945ad8db5eSPekka Enberg 		if (!kvm__load_kernel(kvm, kernel_filename,
11955ad8db5eSPekka Enberg 				initrd_filename, real_cmdline, vidmode))
1196f967c427SPrasad Joshi 			die("unable to load kernel %s", kernel_filename);
1197f967c427SPrasad Joshi 
1198b0b42ba0SPekka Enberg 		kvm->vmlinux = vmlinux_filename;
1199807b77b9SCyrill Gorcunov 		r = symbol_init(kvm);
1200b56f1728SCyrill Gorcunov 		if (r < 0)
1201c4b716ecSPekka Enberg 			pr_debug("symbol_init() failed with error %d\n", r);
12025ad8db5eSPekka Enberg 	}
1203b0b42ba0SPekka Enberg 
1204af7b0868SMatt Evans 	ioport__setup_arch();
1205ac38f433SPekka Enberg 
120620c39545SSasha Levin 	r = rtc__init(kvm);
120720c39545SSasha Levin 	if (r < 0) {
120820c39545SSasha Levin 		pr_err("rtc__init() failed with error %d\n", r);
120920c39545SSasha Levin 		goto fail;
121020c39545SSasha Levin 	}
121164136c1cSPekka Enberg 
121220715a22SSasha Levin 	r = serial8250__init(kvm);
121320715a22SSasha Levin 	if (r < 0) {
121420715a22SSasha Levin 		pr_err("serial__init() failed with error %d\n", r);
121520715a22SSasha Levin 		goto fail;
121620715a22SSasha Levin 	}
1217f967c427SPrasad Joshi 
12189f9207c5SSasha Levin 	r = virtio_blk__init(kvm);
12199f9207c5SSasha Levin 	if (r < 0) {
12209f9207c5SSasha Levin 		pr_err("virtio_blk__init() failed with error %d\n", r);
12219f9207c5SSasha Levin 		goto fail;
12229f9207c5SSasha Levin 	}
12239f9207c5SSasha Levin 
1224a67da3beSAsias He 	r = virtio_scsi_init(kvm);
1225a67da3beSAsias He 	if (r < 0) {
1226a67da3beSAsias He 		pr_err("virtio_scsi_init() failed with error %d\n", r);
1227a67da3beSAsias He 		goto fail;
1228a67da3beSAsias He 	}
1229a67da3beSAsias He 
1230a67da3beSAsias He 
12311621292eSSasha Levin 	if (active_console == CONSOLE_VIRTIO)
1232f967c427SPrasad Joshi 		virtio_console__init(kvm);
1233f967c427SPrasad Joshi 
123453eca082SSasha Levin 	if (virtio_rng)
123553eca082SSasha Levin 		virtio_rng__init(kvm);
123653eca082SSasha Levin 
123782d2f21eSSasha Levin 	if (balloon)
123882d2f21eSSasha Levin 		virtio_bln__init(kvm);
123982d2f21eSSasha Levin 
12404f56d42cSAsias He 	if (!network)
12414f56d42cSAsias He 		network = DEFAULT_NETWORK;
12424f56d42cSAsias He 
1243c7838fbdSSasha Levin 	virtio_9p__init(kvm);
1244c7838fbdSSasha Levin 
12459a6d73f1SSasha Levin 	for (i = 0; i < num_net_devices; i++) {
12469a6d73f1SSasha Levin 		net_params[i].kvm = kvm;
12479a6d73f1SSasha Levin 		virtio_net__init(&net_params[i]);
12489a6d73f1SSasha Levin 	}
1249a4e724ddSSasha Levin 
12509a6d73f1SSasha Levin 	if (num_net_devices == 0 && no_net == 0) {
12519a6d73f1SSasha Levin 		struct virtio_net_params net_params;
12529a6d73f1SSasha Levin 
12539a6d73f1SSasha Levin 		net_params = (struct virtio_net_params) {
12549a6d73f1SSasha Levin 			.guest_ip	= guest_ip,
12559a6d73f1SSasha Levin 			.host_ip	= host_ip,
12569a6d73f1SSasha Levin 			.kvm		= kvm,
12579a6d73f1SSasha Levin 			.script		= script,
12589a6d73f1SSasha Levin 			.mode		= NET_MODE_USER,
12599a6d73f1SSasha Levin 		};
12609a6d73f1SSasha Levin 		str_to_mac(guest_mac, net_params.guest_mac);
12619a6d73f1SSasha Levin 		str_to_mac(host_mac, net_params.host_mac);
12629a6d73f1SSasha Levin 
1263bdfcfca6SSasha Levin 		virtio_net__init(&net_params);
1264bdfcfca6SSasha Levin 	}
12654f56d42cSAsias He 
1266839051d9SSasha Levin 	kvm__init_ram(kvm);
1267839051d9SSasha Levin 
126857d7832bSMatt Evans #ifdef CONFIG_X86
1269714e5b7fSSasha Levin 	kbd__init(kvm);
127057d7832bSMatt Evans #endif
1271714e5b7fSSasha Levin 
127295d13a52SSasha Levin 	pci_shmem__init(kvm);
127395d13a52SSasha Levin 
127448d9e01aSSasha Levin 	if (vnc || sdl) {
12753f838fecSPekka Enberg 		fb = vesa__init(kvm);
127648d9e01aSSasha Levin 		if (IS_ERR(fb)) {
127748d9e01aSSasha Levin 			pr_err("vesa__init() failed with error %ld\n", PTR_ERR(fb));
127848d9e01aSSasha Levin 			goto fail;
127948d9e01aSSasha Levin 		}
12803f838fecSPekka Enberg 	}
12813f838fecSPekka Enberg 
128248d9e01aSSasha Levin 	if (vnc && fb) {
128348d9e01aSSasha Levin 		r = vnc__init(fb);
128448d9e01aSSasha Levin 		if (r < 0) {
128548d9e01aSSasha Levin 			pr_err("vnc__init() failed with error %d\n", r);
128648d9e01aSSasha Levin 			goto fail;
128748d9e01aSSasha Levin 		}
128848d9e01aSSasha Levin 	}
128948d9e01aSSasha Levin 
129048d9e01aSSasha Levin 	if (sdl && fb) {
12913f838fecSPekka Enberg 		sdl__init(fb);
129248d9e01aSSasha Levin 		if (r < 0) {
129348d9e01aSSasha Levin 			pr_err("sdl__init() failed with error %d\n", r);
129448d9e01aSSasha Levin 			goto fail;
129548d9e01aSSasha Levin 		}
12963f838fecSPekka Enberg 	}
1297aba1efa5SPekka Enberg 
129848d9e01aSSasha Levin 	r = fb__start();
129948d9e01aSSasha Levin 	if (r < 0) {
130048d9e01aSSasha Levin 		pr_err("fb__init() failed with error %d\n", r);
130148d9e01aSSasha Levin 		goto fail;
130248d9e01aSSasha Levin 	}
1303aba1efa5SPekka Enberg 
130425af47eeSMatt Evans 	/* Device init all done; firmware init must
130525af47eeSMatt Evans 	 * come after this (it may set up device trees etc.)
130625af47eeSMatt Evans 	 */
130725af47eeSMatt Evans 
130825af47eeSMatt Evans 	kvm__start_timer(kvm);
130925af47eeSMatt Evans 
13105ad8db5eSPekka Enberg 	if (firmware_filename) {
13115ad8db5eSPekka Enberg 		if (!kvm__load_firmware(kvm, firmware_filename))
13125ad8db5eSPekka Enberg 			die("unable to load firmware image %s: %s", firmware_filename, strerror(errno));
13135ad8db5eSPekka Enberg 	} else {
1314e1e46fe6SSasha Levin 		kvm__arch_setup_firmware(kvm);
13151add9f73SSasha Levin 		if (r < 0) {
13161add9f73SSasha Levin 			pr_err("kvm__arch_setup_firmware() failed with error %d\n", r);
13171add9f73SSasha Levin 			goto fail;
13181add9f73SSasha Levin 		}
13195ad8db5eSPekka Enberg 	}
132025af47eeSMatt Evans 
132125af47eeSMatt Evans 	for (i = 0; i < nrcpus; i++) {
132225af47eeSMatt Evans 		kvm_cpus[i] = kvm_cpu__init(kvm, i);
132325af47eeSMatt Evans 		if (!kvm_cpus[i])
132425af47eeSMatt Evans 			die("unable to initialize KVM VCPU");
132525af47eeSMatt Evans 	}
132625af47eeSMatt Evans 
1327d60bafe5SSasha Levin 	thread_pool__init(nr_online_cpus);
13284932d174SSasha Levin fail:
13294932d174SSasha Levin 	return r;
1330e1e46fe6SSasha Levin }
1331e1e46fe6SSasha Levin 
1332e1e46fe6SSasha Levin static int kvm_cmd_run_work(void)
1333e1e46fe6SSasha Levin {
1334e1e46fe6SSasha Levin 	int i, r = -1;
1335e1e46fe6SSasha Levin 	void *ret = NULL;
1336e1e46fe6SSasha Levin 
1337839051d9SSasha Levin 	for (i = 0; i < nrcpus; i++) {
1338d77a9efaSCyrill Gorcunov 		if (pthread_create(&kvm_cpus[i]->thread, NULL, kvm_cpu_thread, kvm_cpus[i]) != 0)
13395ee154d1SPekka Enberg 			die("unable to create KVM VCPU thread");
13405ee154d1SPekka Enberg 	}
13415ee154d1SPekka Enberg 
134249e5227dSSasha Levin 	/* Only VCPU #0 is going to exit by itself when shutting down */
134349e5227dSSasha Levin 	if (pthread_join(kvm_cpus[0]->thread, &ret) != 0)
1344e1e46fe6SSasha Levin 		r = 0;
13455ee154d1SPekka Enberg 
134689e0575aSPekka Enberg 	kvm_cpu__delete(kvm_cpus[0]);
134720715a22SSasha Levin 	kvm_cpus[0] = NULL;
134889e0575aSPekka Enberg 
134949e5227dSSasha Levin 	for (i = 1; i < nrcpus; i++) {
1350c23d9748SSasha Levin 		if (kvm_cpus[i]->is_running) {
135149e5227dSSasha Levin 			pthread_kill(kvm_cpus[i]->thread, SIGKVMEXIT);
1352d77a9efaSCyrill Gorcunov 			if (pthread_join(kvm_cpus[i]->thread, &ret) != 0)
13535ee154d1SPekka Enberg 				die("pthread_join");
135489e0575aSPekka Enberg 			kvm_cpu__delete(kvm_cpus[i]);
1355c23d9748SSasha Levin 		}
1356e1e46fe6SSasha Levin 		if (ret == NULL)
1357e1e46fe6SSasha Levin 			r = 0;
13585ee154d1SPekka Enberg 	}
1359f967c427SPrasad Joshi 
1360e1e46fe6SSasha Levin 	return r;
1361e1e46fe6SSasha Levin }
1362e1e46fe6SSasha Levin 
13634932d174SSasha Levin static void kvm_cmd_run_exit(int guest_ret)
1364e1e46fe6SSasha Levin {
13654932d174SSasha Levin 	int r = 0;
13664932d174SSasha Levin 
1367e6694207SSasha Levin 	compat__print_all_messages();
1368e6694207SSasha Levin 
1369807b77b9SCyrill Gorcunov 	r = symbol_exit(kvm);
13704932d174SSasha Levin 	if (r < 0)
1371807b77b9SCyrill Gorcunov 		pr_warning("symbol_exit() failed with error %d\n", r);
13724932d174SSasha Levin 
1373e3c4f8aaSSasha Levin 	r = irq__exit(kvm);
1374e3c4f8aaSSasha Levin 	if (r < 0)
1375e3c4f8aaSSasha Levin 		pr_warning("irq__exit() failed with error %d\n", r);
1376e3c4f8aaSSasha Levin 
1377aba1efa5SPekka Enberg 	fb__stop();
1378aba1efa5SPekka Enberg 
1379a67da3beSAsias He 	r = virtio_scsi_exit(kvm);
1380a67da3beSAsias He 	if (r < 0)
1381a67da3beSAsias He 		pr_warning("virtio_scsi_exit() failed with error %d\n", r);
1382a67da3beSAsias He 
13839f9207c5SSasha Levin 	r = virtio_blk__exit(kvm);
13849f9207c5SSasha Levin 	if (r < 0)
13859f9207c5SSasha Levin 		pr_warning("virtio_blk__exit() failed with error %d\n", r);
13869f9207c5SSasha Levin 
1387495fbd4eSSasha Levin 	r = virtio_rng__exit(kvm);
1388495fbd4eSSasha Levin 	if (r < 0)
1389495fbd4eSSasha Levin 		pr_warning("virtio_rng__exit() failed with error %d\n", r);
1390a0a1e3c2SPrasad Joshi 
13919f9207c5SSasha Levin 	r = disk_image__close_all(kvm->disks, image_count);
13929f9207c5SSasha Levin 	if (r < 0)
13939f9207c5SSasha Levin 		pr_warning("disk_image__close_all() failed with error %d\n", r);
13947af40b91SSasha Levin 
139520715a22SSasha Levin 	r = serial8250__exit(kvm);
139620715a22SSasha Levin 	if (r < 0)
139720715a22SSasha Levin 		pr_warning("serial8250__exit() failed with error %d\n", r);
139820715a22SSasha Levin 
139920c39545SSasha Levin 	r = rtc__exit(kvm);
140020c39545SSasha Levin 	if (r < 0)
140120c39545SSasha Levin 		pr_warning("rtc__exit() failed with error %d\n", r);
140220c39545SSasha Levin 
14031add9f73SSasha Levin 	r = kvm__arch_free_firmware(kvm);
14041add9f73SSasha Levin 	if (r < 0)
14051add9f73SSasha Levin 		pr_warning("kvm__arch_free_firmware() failed with error %d\n", r);
14061add9f73SSasha Levin 
14077af40b91SSasha Levin 	r = ioport__exit(kvm);
14087af40b91SSasha Levin 	if (r < 0)
14097af40b91SSasha Levin 		pr_warning("ioport__exit() failed with error %d\n", r);
14107af40b91SSasha Levin 
1411ea6eeb1cSSasha Levin 	r = ioeventfd__exit(kvm);
1412ea6eeb1cSSasha Levin 	if (r < 0)
1413ea6eeb1cSSasha Levin 		pr_warning("ioeventfd__exit() failed with error %d\n", r);
1414ea6eeb1cSSasha Levin 
14156d987703SSasha Levin 	r = pci__exit(kvm);
14166d987703SSasha Levin 	if (r < 0)
14176d987703SSasha Levin 		pr_warning("pci__exit() failed with error %d\n", r);
14186d987703SSasha Levin 
1419495fbd4eSSasha Levin 	r = kvm__exit(kvm);
1420495fbd4eSSasha Levin 	if (r < 0)
1421495fbd4eSSasha Levin 		pr_warning("pci__exit() failed with error %d\n", r);
1422f967c427SPrasad Joshi 
142349777800SPekka Enberg 	free(kvm_cpus);
142449777800SPekka Enberg 
1425e1e46fe6SSasha Levin 	if (guest_ret == 0)
1426f967c427SPrasad Joshi 		printf("\n  # KVM session ended normally.\n");
1427e1e46fe6SSasha Levin }
1428e1e46fe6SSasha Levin 
/*
 * Entry point of the "run" command: initialise, run the guest, tear down.
 *
 * Returns the negative value from kvm_cmd_run_init() when initialisation
 * fails (no teardown is performed in that case), otherwise the result of
 * kvm_cmd_run_work().  @prefix is not used here.
 */
int kvm_cmd_run(int argc, const char **argv, const char *prefix)
{
	int guest_status;
	int init_status = kvm_cmd_run_init(argc, argv);

	if (init_status < 0)
		return init_status;

	guest_status = kvm_cmd_run_work();
	kvm_cmd_run_exit(guest_status);

	return guest_status;
}
1442