xref: /kvmtool/builtin-run.c (revision 69f50425bd17e458c17942fa4189020dd309cd7b)
1ece09f8fSPekka Enberg #include "kvm/builtin-run.h"
2ece09f8fSPekka Enberg 
3c8675741SSasha Levin #include "kvm/builtin-setup.h"
4ece09f8fSPekka Enberg #include "kvm/virtio-balloon.h"
5ece09f8fSPekka Enberg #include "kvm/virtio-console.h"
6ece09f8fSPekka Enberg #include "kvm/parse-options.h"
7ece09f8fSPekka Enberg #include "kvm/8250-serial.h"
8ece09f8fSPekka Enberg #include "kvm/framebuffer.h"
9ece09f8fSPekka Enberg #include "kvm/disk-image.h"
10ece09f8fSPekka Enberg #include "kvm/threadpool.h"
11a67da3beSAsias He #include "kvm/virtio-scsi.h"
12ece09f8fSPekka Enberg #include "kvm/virtio-blk.h"
13ece09f8fSPekka Enberg #include "kvm/virtio-net.h"
14ece09f8fSPekka Enberg #include "kvm/virtio-rng.h"
15ece09f8fSPekka Enberg #include "kvm/ioeventfd.h"
16ece09f8fSPekka Enberg #include "kvm/virtio-9p.h"
17ece09f8fSPekka Enberg #include "kvm/barrier.h"
18ece09f8fSPekka Enberg #include "kvm/kvm-cpu.h"
19ece09f8fSPekka Enberg #include "kvm/ioport.h"
20ece09f8fSPekka Enberg #include "kvm/symbol.h"
21ece09f8fSPekka Enberg #include "kvm/i8042.h"
22ece09f8fSPekka Enberg #include "kvm/mutex.h"
23ece09f8fSPekka Enberg #include "kvm/term.h"
24ece09f8fSPekka Enberg #include "kvm/util.h"
25ec52d504SLai Jiangshan #include "kvm/strbuf.h"
26ece09f8fSPekka Enberg #include "kvm/vesa.h"
27ece09f8fSPekka Enberg #include "kvm/irq.h"
28ece09f8fSPekka Enberg #include "kvm/kvm.h"
29ece09f8fSPekka Enberg #include "kvm/pci.h"
30ece09f8fSPekka Enberg #include "kvm/rtc.h"
31ece09f8fSPekka Enberg #include "kvm/sdl.h"
32ece09f8fSPekka Enberg #include "kvm/vnc.h"
33e6694207SSasha Levin #include "kvm/guest_compat.h"
3495d13a52SSasha Levin #include "kvm/pci-shmem.h"
354b1addaeSSasha Levin #include "kvm/kvm-ipc.h"
364b1c6f6eSSasha Levin #include "kvm/builtin-debug.h"
37ece09f8fSPekka Enberg 
38ece09f8fSPekka Enberg #include <linux/types.h>
3948d9e01aSSasha Levin #include <linux/err.h>
40ece09f8fSPekka Enberg 
418329f30bSPekka Enberg #include <sys/utsname.h>
428329f30bSPekka Enberg #include <sys/types.h>
438329f30bSPekka Enberg #include <sys/stat.h>
44ece09f8fSPekka Enberg #include <termios.h>
45ece09f8fSPekka Enberg #include <signal.h>
46ece09f8fSPekka Enberg #include <stdlib.h>
47ece09f8fSPekka Enberg #include <string.h>
48ece09f8fSPekka Enberg #include <unistd.h>
4926c853e4SPrasad Joshi #include <ctype.h>
50ece09f8fSPekka Enberg #include <stdio.h>
51f967c427SPrasad Joshi 
52f967c427SPrasad Joshi #define MB_SHIFT		(20)
5395d13a52SSasha Levin #define KB_SHIFT		(10)
5495d13a52SSasha Levin #define GB_SHIFT		(30)
55f967c427SPrasad Joshi 
/* VCPU owned by the calling thread; assigned in kvm_cpu_thread(). */
__thread struct kvm_cpu *current_kvm_cpu;

/* One of the KVM_RUN_* values below; selects how leftover arguments are used. */
static int  kvm_run_wrapper;

/* Toggled by the --debug command line option. */
bool do_debug_print = false;

/*
 * Linker-provided symbols for the embedded guest init binary: the address of
 * _binary_guest_init_start is the data, the address of
 * _binary_guest_init_size is its length (see kvm_setup_guest_init()).
 */
extern char _binary_guest_init_start;
extern char _binary_guest_init_size;

/* Usage banner handed to the option parser. */
static const char * const run_usage[] = {
	"lkvm run [<options>] [<kernel image>]",
	NULL
};

/* Wrapper modes; KVM_RUN_DEFAULT must stay first so it is the zero value. */
enum {
	KVM_RUN_DEFAULT,
	KVM_RUN_SANDBOX,
};
743c29e2aaSSasha Levin 
75a33979d8SSasha Levin static int img_name_parser(const struct option *opt, const char *arg, int unset)
76a33979d8SSasha Levin {
7782d65b5eSSasha Levin 	char path[PATH_MAX];
785236b505SAsias He 	struct stat st;
79a33979d8SSasha Levin 
809667701cSPekka Enberg 	snprintf(path, PATH_MAX, "%s%s", kvm__get_dir(), arg);
8182d65b5eSSasha Levin 
82cac9e8fdSSasha Levin 	if ((stat(arg, &st) == 0 && S_ISDIR(st.st_mode)) ||
83cac9e8fdSSasha Levin 	   (stat(path, &st) == 0 && S_ISDIR(st.st_mode)))
84cac9e8fdSSasha Levin 		return virtio_9p_img_name_parser(opt, arg, unset);
853b55dcdeSSasha Levin 	return disk_img_name_parser(opt, arg, unset);
86a67da3beSAsias He }
87a67da3beSAsias He 
883b55dcdeSSasha Levin void kvm_run_set_wrapper_sandbox(void)
893b55dcdeSSasha Levin {
903b55dcdeSSasha Levin 	kvm_run_wrapper = KVM_RUN_SANDBOX;
91a33979d8SSasha Levin }
92a33979d8SSasha Levin 
/*
 * Fallback for builds that do not define OPT_ARCH_RUN: contribute no extra
 * entries to the option table.
 * NOTE(review): presumably reached through OPT_ARCH(RUN, ...) below, whose
 * definition is not in this file - confirm.
 */
#ifndef OPT_ARCH_RUN
#define OPT_ARCH_RUN(...)
#endif

/*
 * Declare a 'struct option' array called 'name' describing every option of
 * the run command.
 *
 *   name - identifier of the array to declare
 *   cfg  - pointer to the configuration structure the options store into
 *   kvm  - value passed to the callbacks that take one
 *
 * The expansion is a declaration and already ends in ';'.
 */
#define BUILD_OPTIONS(name, cfg, kvm)					\
	struct option name[] = {					\
	OPT_GROUP("Basic options:"),					\
	OPT_STRING('\0', "name", &(cfg)->guest_name, "guest name",	\
			"A name for the guest"),			\
	OPT_INTEGER('c', "cpus", &(cfg)->nrcpus, "Number of CPUs"),	\
	OPT_U64('m', "mem", &(cfg)->ram_size, "Virtual machine memory"	\
		" size in MiB."),					\
	OPT_CALLBACK('\0', "shmem", NULL,				\
		     "[pci:]<addr>:<size>[:handle=<handle>][:create]",	\
		     "Share host shmem with guest via pci device",	\
		     shmem_parser, NULL),				\
	OPT_CALLBACK('d', "disk", kvm, "image or rootfs_dir",		\
			"Disk image or rootfs directory",		\
			img_name_parser, kvm),				\
	OPT_BOOLEAN('\0', "balloon", &(cfg)->balloon, "Enable virtio"	\
			" balloon"),					\
	OPT_BOOLEAN('\0', "vnc", &(cfg)->vnc, "Enable VNC framebuffer"),\
	OPT_BOOLEAN('\0', "gtk", &(cfg)->gtk, "Enable GTK framebuffer"),\
	OPT_BOOLEAN('\0', "sdl", &(cfg)->sdl, "Enable SDL framebuffer"),\
	OPT_BOOLEAN('\0', "rng", &(cfg)->virtio_rng, "Enable virtio"	\
			" Random Number Generator"),			\
	OPT_CALLBACK('\0', "9p", NULL, "dir_to_share,tag_name",		\
		     "Enable virtio 9p to share files between host and"	\
		     " guest", virtio_9p_rootdir_parser, kvm),		\
	OPT_STRING('\0', "console", &(cfg)->console, "serial, virtio or"\
			" hv", "Console to use"),			\
	OPT_STRING('\0', "dev", &(cfg)->dev, "device_file",		\
			"KVM device file"),				\
	OPT_CALLBACK('\0', "tty", NULL, "tty id",			\
		     "Remap guest TTY into a pty on the host",		\
		     tty_parser, NULL),					\
	OPT_STRING('\0', "sandbox", &(cfg)->sandbox, "script",		\
			"Run this script when booting into custom"	\
			" rootfs"),					\
	OPT_STRING('\0', "hugetlbfs", &(cfg)->hugetlbfs_path, "path",	\
			"Hugetlbfs path"),				\
									\
	OPT_GROUP("Kernel options:"),					\
	OPT_STRING('k', "kernel", &(cfg)->kernel_filename, "kernel",	\
			"Kernel to boot in virtual machine"),		\
	OPT_STRING('i', "initrd", &(cfg)->initrd_filename, "initrd",	\
			"Initial RAM disk image"),			\
	OPT_STRING('p', "params", &(cfg)->kernel_cmdline, "params",	\
			"Kernel command line arguments"),		\
	OPT_STRING('f', "firmware", &(cfg)->firmware_filename, "firmware",\
			"Firmware image to boot in virtual machine"),	\
									\
	OPT_GROUP("Networking options:"),				\
	OPT_CALLBACK_DEFAULT('n', "network", NULL, "network params",	\
		     "Create a new guest NIC",				\
		     netdev_parser, NULL, kvm),				\
	OPT_BOOLEAN('\0', "no-dhcp", &(cfg)->no_dhcp, "Disable kernel"	\
			" DHCP in rootfs mode"),			\
									\
	OPT_GROUP("Debug options:"),					\
	OPT_BOOLEAN('\0', "debug", &do_debug_print,			\
			"Enable debug messages"),			\
	OPT_BOOLEAN('\0', "debug-single-step", &(cfg)->single_step,	\
			"Enable single stepping"),			\
	OPT_BOOLEAN('\0', "debug-ioport", &(cfg)->ioport_debug,		\
			"Enable ioport debugging"),			\
	OPT_BOOLEAN('\0', "debug-mmio", &(cfg)->mmio_debug,		\
			"Enable MMIO debugging"),			\
	OPT_INTEGER('\0', "debug-iodelay", &(cfg)->debug_iodelay,	\
			"Delay IO by millisecond"),			\
									\
	OPT_ARCH(RUN, cfg)						\
	OPT_END()							\
	};
167f967c427SPrasad Joshi 
1685ee154d1SPekka Enberg static void *kvm_cpu_thread(void *arg)
1695ee154d1SPekka Enberg {
170a4d8c55eSSasha Levin 	char name[16];
171a4d8c55eSSasha Levin 
172d77a9efaSCyrill Gorcunov 	current_kvm_cpu = arg;
1735ee154d1SPekka Enberg 
174a4d8c55eSSasha Levin 	sprintf(name, "kvm-vcpu-%lu", current_kvm_cpu->cpu_id);
175a4d8c55eSSasha Levin 	kvm__set_thread_name(name);
176a4d8c55eSSasha Levin 
177d77a9efaSCyrill Gorcunov 	if (kvm_cpu__start(current_kvm_cpu))
1785ee154d1SPekka Enberg 		goto panic_kvm;
1795ee154d1SPekka Enberg 
1805ee154d1SPekka Enberg 	return (void *) (intptr_t) 0;
1815ee154d1SPekka Enberg 
1825ee154d1SPekka Enberg panic_kvm:
1833fdf659dSSasha Levin 	fprintf(stderr, "KVM exit reason: %u (\"%s\")\n",
184d77a9efaSCyrill Gorcunov 		current_kvm_cpu->kvm_run->exit_reason,
185d77a9efaSCyrill Gorcunov 		kvm_exit_reasons[current_kvm_cpu->kvm_run->exit_reason]);
186d77a9efaSCyrill Gorcunov 	if (current_kvm_cpu->kvm_run->exit_reason == KVM_EXIT_UNKNOWN)
187*69f50425SAndreas Herrmann 		fprintf(stderr, "KVM exit code: 0x%llu\n",
188*69f50425SAndreas Herrmann 			(unsigned long long)current_kvm_cpu->kvm_run->hw.hardware_exit_reason);
1898e5accedSPekka Enberg 
190b7d2f013SSasha Levin 	kvm_cpu__set_debug_fd(STDOUT_FILENO);
191d77a9efaSCyrill Gorcunov 	kvm_cpu__show_registers(current_kvm_cpu);
192d77a9efaSCyrill Gorcunov 	kvm_cpu__show_code(current_kvm_cpu);
193d77a9efaSCyrill Gorcunov 	kvm_cpu__show_page_tables(current_kvm_cpu);
1945ee154d1SPekka Enberg 
1955ee154d1SPekka Enberg 	return (void *) (intptr_t) 1;
1965ee154d1SPekka Enberg }
1975ee154d1SPekka Enberg 
198e08c0896SPrasad Joshi static char kernel[PATH_MAX];
199b0b42ba0SPekka Enberg 
200b0b42ba0SPekka Enberg static const char *host_kernels[] = {
201e08c0896SPrasad Joshi 	"/boot/vmlinuz",
202e08c0896SPrasad Joshi 	"/boot/bzImage",
203e08c0896SPrasad Joshi 	NULL
204e08c0896SPrasad Joshi };
205b0b42ba0SPekka Enberg 
206b0b42ba0SPekka Enberg static const char *default_kernels[] = {
207e08c0896SPrasad Joshi 	"./bzImage",
208b03af790SKonstantin Khlebnikov 	"arch/" BUILD_ARCH "/boot/bzImage",
209af7b0868SMatt Evans 	"../../arch/" BUILD_ARCH "/boot/bzImage",
210e08c0896SPrasad Joshi 	NULL
211e08c0896SPrasad Joshi };
2128329f30bSPekka Enberg 
213b0b42ba0SPekka Enberg static const char *default_vmlinux[] = {
214b03af790SKonstantin Khlebnikov 	"vmlinux",
215b0b42ba0SPekka Enberg 	"../../../vmlinux",
216b0b42ba0SPekka Enberg 	"../../vmlinux",
217b0b42ba0SPekka Enberg 	NULL
218b0b42ba0SPekka Enberg };
219b0b42ba0SPekka Enberg 
220e08c0896SPrasad Joshi static void kernel_usage_with_options(void)
2218329f30bSPekka Enberg {
222e08c0896SPrasad Joshi 	const char **k;
2238329f30bSPekka Enberg 	struct utsname uts;
224e08c0896SPrasad Joshi 
225e08c0896SPrasad Joshi 	fprintf(stderr, "Fatal: could not find default kernel image in:\n");
22665182f37SPrasad Joshi 	k = &default_kernels[0];
227e08c0896SPrasad Joshi 	while (*k) {
228e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", *k);
229e08c0896SPrasad Joshi 		k++;
230e08c0896SPrasad Joshi 	}
231e08c0896SPrasad Joshi 
232e08c0896SPrasad Joshi 	if (uname(&uts) < 0)
233e08c0896SPrasad Joshi 		return;
234e08c0896SPrasad Joshi 
235e08c0896SPrasad Joshi 	k = &host_kernels[0];
236e08c0896SPrasad Joshi 	while (*k) {
237e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
238e08c0896SPrasad Joshi 			return;
239e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", kernel);
240e08c0896SPrasad Joshi 		k++;
241e08c0896SPrasad Joshi 	}
242ee8b1456SWanlong Gao 	fprintf(stderr, "\nPlease see '%s run --help' for more options.\n\n",
243ee8b1456SWanlong Gao 		KVM_BINARY_NAME);
244e08c0896SPrasad Joshi }
245e08c0896SPrasad Joshi 
24660ded003SPekka Enberg static u64 host_ram_size(void)
24760ded003SPekka Enberg {
24860ded003SPekka Enberg 	long page_size;
24960ded003SPekka Enberg 	long nr_pages;
25060ded003SPekka Enberg 
25160ded003SPekka Enberg 	nr_pages	= sysconf(_SC_PHYS_PAGES);
252d63c5ce6SPekka Enberg 	if (nr_pages < 0) {
2534542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PHYS_PAGES) failed");
254d63c5ce6SPekka Enberg 		return 0;
255d63c5ce6SPekka Enberg 	}
25660ded003SPekka Enberg 
25760ded003SPekka Enberg 	page_size	= sysconf(_SC_PAGE_SIZE);
258d63c5ce6SPekka Enberg 	if (page_size < 0) {
2594542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PAGE_SIZE) failed");
260d63c5ce6SPekka Enberg 		return 0;
261d63c5ce6SPekka Enberg 	}
26260ded003SPekka Enberg 
26360ded003SPekka Enberg 	return (nr_pages * page_size) >> MB_SHIFT;
26460ded003SPekka Enberg }
26560ded003SPekka Enberg 
26618bd8c3bSPekka Enberg /*
26718bd8c3bSPekka Enberg  * If user didn't specify how much memory it wants to allocate for the guest,
26818bd8c3bSPekka Enberg  * avoid filling the whole host RAM.
26918bd8c3bSPekka Enberg  */
27018bd8c3bSPekka Enberg #define RAM_SIZE_RATIO		0.8
27118bd8c3bSPekka Enberg 
272fd834defSPekka Enberg static u64 get_ram_size(int nr_cpus)
273fd834defSPekka Enberg {
27406761c76SPekka Enberg 	u64 available;
27506761c76SPekka Enberg 	u64 ram_size;
276fd834defSPekka Enberg 
277fd834defSPekka Enberg 	ram_size	= 64 * (nr_cpus + 3);
278fd834defSPekka Enberg 
27960ded003SPekka Enberg 	available	= host_ram_size() * RAM_SIZE_RATIO;
280d63c5ce6SPekka Enberg 	if (!available)
281d63c5ce6SPekka Enberg 		available = MIN_RAM_SIZE_MB;
282fd834defSPekka Enberg 
283fd834defSPekka Enberg 	if (ram_size > available)
284fd834defSPekka Enberg 		ram_size	= available;
285fd834defSPekka Enberg 
286fd834defSPekka Enberg 	return ram_size;
287fd834defSPekka Enberg }
288fd834defSPekka Enberg 
289e08c0896SPrasad Joshi static const char *find_kernel(void)
290e08c0896SPrasad Joshi {
291e08c0896SPrasad Joshi 	const char **k;
2928329f30bSPekka Enberg 	struct stat st;
293e08c0896SPrasad Joshi 	struct utsname uts;
294e08c0896SPrasad Joshi 
29565182f37SPrasad Joshi 	k = &default_kernels[0];
296e08c0896SPrasad Joshi 	while (*k) {
297e08c0896SPrasad Joshi 		if (stat(*k, &st) < 0 || !S_ISREG(st.st_mode)) {
298e08c0896SPrasad Joshi 			k++;
299e08c0896SPrasad Joshi 			continue;
300e08c0896SPrasad Joshi 		}
301e08c0896SPrasad Joshi 		strncpy(kernel, *k, PATH_MAX);
302e08c0896SPrasad Joshi 		return kernel;
303e08c0896SPrasad Joshi 	}
3048329f30bSPekka Enberg 
3058329f30bSPekka Enberg 	if (uname(&uts) < 0)
3068329f30bSPekka Enberg 		return NULL;
3078329f30bSPekka Enberg 
308e08c0896SPrasad Joshi 	k = &host_kernels[0];
309e08c0896SPrasad Joshi 	while (*k) {
310e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
3118329f30bSPekka Enberg 			return NULL;
3128329f30bSPekka Enberg 
313e08c0896SPrasad Joshi 		if (stat(kernel, &st) < 0 || !S_ISREG(st.st_mode)) {
314e08c0896SPrasad Joshi 			k++;
315e08c0896SPrasad Joshi 			continue;
316e08c0896SPrasad Joshi 		}
317e08c0896SPrasad Joshi 		return kernel;
3188329f30bSPekka Enberg 
319e08c0896SPrasad Joshi 	}
3208329f30bSPekka Enberg 	return NULL;
3218329f30bSPekka Enberg }
3228329f30bSPekka Enberg 
323b0b42ba0SPekka Enberg static const char *find_vmlinux(void)
324b0b42ba0SPekka Enberg {
325b0b42ba0SPekka Enberg 	const char **vmlinux;
326b0b42ba0SPekka Enberg 
327b0b42ba0SPekka Enberg 	vmlinux = &default_vmlinux[0];
328b0b42ba0SPekka Enberg 	while (*vmlinux) {
329b0b42ba0SPekka Enberg 		struct stat st;
330b0b42ba0SPekka Enberg 
331b0b42ba0SPekka Enberg 		if (stat(*vmlinux, &st) < 0 || !S_ISREG(st.st_mode)) {
332b0b42ba0SPekka Enberg 			vmlinux++;
333b0b42ba0SPekka Enberg 			continue;
334b0b42ba0SPekka Enberg 		}
335b0b42ba0SPekka Enberg 		return *vmlinux;
336b0b42ba0SPekka Enberg 	}
337b0b42ba0SPekka Enberg 	return NULL;
338b0b42ba0SPekka Enberg }
339b0b42ba0SPekka Enberg 
340f6677a1dSAmerigo Wang void kvm_run_help(void)
341f6677a1dSAmerigo Wang {
3424346fd8fSSasha Levin 	struct kvm *kvm = NULL;
3434346fd8fSSasha Levin 
3443b55dcdeSSasha Levin 	BUILD_OPTIONS(options, &kvm->cfg, kvm);
345f6677a1dSAmerigo Wang 	usage_with_options(run_usage, options);
346f6677a1dSAmerigo Wang }
347f6677a1dSAmerigo Wang 
3484346fd8fSSasha Levin static int kvm_setup_guest_init(struct kvm *kvm)
3499cec19c8SSasha Levin {
35047621338SSasha Levin 	const char *rootfs = kvm->cfg.custom_rootfs_name;
351afc2c7c0SAsias He 	char tmp[PATH_MAX];
352afc2c7c0SAsias He 	size_t size;
353afc2c7c0SAsias He 	int fd, ret;
354afc2c7c0SAsias He 	char *data;
3559cec19c8SSasha Levin 
356afc2c7c0SAsias He 	/* Setup /virt/init */
357afc2c7c0SAsias He 	size = (size_t)&_binary_guest_init_size;
358afc2c7c0SAsias He 	data = (char *)&_binary_guest_init_start;
359afc2c7c0SAsias He 	snprintf(tmp, PATH_MAX, "%s%s/virt/init", kvm__get_dir(), rootfs);
360afc2c7c0SAsias He 	remove(tmp);
361afc2c7c0SAsias He 	fd = open(tmp, O_CREAT | O_WRONLY, 0755);
362afc2c7c0SAsias He 	if (fd < 0)
363afc2c7c0SAsias He 		die("Fail to setup %s", tmp);
364afc2c7c0SAsias He 	ret = xwrite(fd, data, size);
365afc2c7c0SAsias He 	if (ret < 0)
366afc2c7c0SAsias He 		die("Fail to setup %s", tmp);
367afc2c7c0SAsias He 	close(fd);
3689cec19c8SSasha Levin 
369afc2c7c0SAsias He 	return 0;
3709cec19c8SSasha Levin }
3719cec19c8SSasha Levin 
3724346fd8fSSasha Levin static int kvm_run_set_sandbox(struct kvm *kvm)
373d50fe489SSasha Levin {
37447621338SSasha Levin 	const char *guestfs_name = kvm->cfg.custom_rootfs_name;
375d50fe489SSasha Levin 	char path[PATH_MAX], script[PATH_MAX], *tmp;
376d50fe489SSasha Levin 
377d50fe489SSasha Levin 	snprintf(path, PATH_MAX, "%s%s/virt/sandbox.sh", kvm__get_dir(), guestfs_name);
378d50fe489SSasha Levin 
379d50fe489SSasha Levin 	remove(path);
380d50fe489SSasha Levin 
38147621338SSasha Levin 	if (kvm->cfg.sandbox == NULL)
382d50fe489SSasha Levin 		return 0;
383d50fe489SSasha Levin 
38447621338SSasha Levin 	tmp = realpath(kvm->cfg.sandbox, NULL);
385d50fe489SSasha Levin 	if (tmp == NULL)
386d50fe489SSasha Levin 		return -ENOMEM;
387d50fe489SSasha Levin 
388d50fe489SSasha Levin 	snprintf(script, PATH_MAX, "/host/%s", tmp);
389d50fe489SSasha Levin 	free(tmp);
390d50fe489SSasha Levin 
391d50fe489SSasha Levin 	return symlink(script, path);
392d50fe489SSasha Levin }
393d50fe489SSasha Levin 
/* Write 'len' bytes of 'buf' to 'fd'; die() if write() returns <= 0. */
static void sandbox_write_or_die(int fd, const void *buf, size_t len)
{
	if (write(fd, buf, len) <= 0)
		die("Failed writing sandbox script");
}

/*
 * Write 'arg' to 'fd' quoted so that a shell reads it back as exactly one
 * word with the same contents:
 *   - an empty string becomes ''
 *   - every run of characters without a single quote becomes 'run'
 *   - every single quote becomes "'"
 *
 * Calls die() on any write failure.
 */
static void kvm_write_sandbox_cmd_exactly(int fd, const char *arg)
{
	const char *cursor = arg;

	if (*cursor == '\0') {
		sandbox_write_or_die(fd, "''", 2);
		return;
	}

	while (*cursor != '\0') {
		/* Points at the next single quote, or at the terminating NUL. */
		const char *quote = strchrnul(cursor, '\'');

		if (quote != cursor) {
			sandbox_write_or_die(fd, "'", 1);
			sandbox_write_or_die(fd, cursor, quote - cursor);
			sandbox_write_or_die(fd, "'", 1);
		}

		if (*quote == '\0')
			return;

		sandbox_write_or_die(fd, "\"'\"", 3);
		cursor = quote + 1;
	}
}
4255173b4afSLai Jiangshan 
4265cd19aa0SPekka Enberg static void resolve_program(const char *src, char *dst, size_t len)
4275cd19aa0SPekka Enberg {
4285cd19aa0SPekka Enberg 	struct stat st;
429c2c742d9SPekka Enberg 	int err;
4305cd19aa0SPekka Enberg 
431c2c742d9SPekka Enberg 	err = stat(src, &st);
4325cd19aa0SPekka Enberg 
433c2c742d9SPekka Enberg 	if (!err && S_ISREG(st.st_mode)) {
4345cd19aa0SPekka Enberg 		char resolved_path[PATH_MAX];
4355cd19aa0SPekka Enberg 
436de3f75c9SPekka Enberg 		if (!realpath(src, resolved_path))
437de3f75c9SPekka Enberg 			die("Unable to resolve program %s: %s\n", src, strerror(errno));
4385cd19aa0SPekka Enberg 
4395cd19aa0SPekka Enberg 		snprintf(dst, len, "/host%s", resolved_path);
4405cd19aa0SPekka Enberg 	} else
4415cd19aa0SPekka Enberg 		strncpy(dst, src, len);
4425cd19aa0SPekka Enberg }
4435cd19aa0SPekka Enberg 
4444346fd8fSSasha Levin static void kvm_run_write_sandbox_cmd(struct kvm *kvm, const char **argv, int argc)
4453c29e2aaSSasha Levin {
4463c29e2aaSSasha Levin 	const char script_hdr[] = "#! /bin/bash\n\n";
4475cd19aa0SPekka Enberg 	char program[PATH_MAX];
4483c29e2aaSSasha Levin 	int fd;
4493c29e2aaSSasha Levin 
45047621338SSasha Levin 	remove(kvm->cfg.sandbox);
4513c29e2aaSSasha Levin 
45247621338SSasha Levin 	fd = open(kvm->cfg.sandbox, O_RDWR | O_CREAT, 0777);
4533c29e2aaSSasha Levin 	if (fd < 0)
4543c29e2aaSSasha Levin 		die("Failed creating sandbox script");
4553c29e2aaSSasha Levin 
4563c29e2aaSSasha Levin 	if (write(fd, script_hdr, sizeof(script_hdr) - 1) <= 0)
4573c29e2aaSSasha Levin 		die("Failed writing sandbox script");
4583c29e2aaSSasha Levin 
4595cd19aa0SPekka Enberg 	resolve_program(argv[0], program, PATH_MAX);
4605cd19aa0SPekka Enberg 	kvm_write_sandbox_cmd_exactly(fd, program);
4615cd19aa0SPekka Enberg 
4625cd19aa0SPekka Enberg 	argv++;
4635cd19aa0SPekka Enberg 	argc--;
4645cd19aa0SPekka Enberg 
4653c29e2aaSSasha Levin 	while (argc) {
4663c29e2aaSSasha Levin 		if (write(fd, " ", 1) <= 0)
4673c29e2aaSSasha Levin 			die("Failed writing sandbox script");
4685cd19aa0SPekka Enberg 
4695cd19aa0SPekka Enberg 		kvm_write_sandbox_cmd_exactly(fd, argv[0]);
4703c29e2aaSSasha Levin 		argv++;
4713c29e2aaSSasha Levin 		argc--;
4723c29e2aaSSasha Levin 	}
4733c29e2aaSSasha Levin 	if (write(fd, "\n", 1) <= 0)
4743c29e2aaSSasha Levin 		die("Failed writing sandbox script");
4753c29e2aaSSasha Levin 
4763c29e2aaSSasha Levin 	close(fd);
4773c29e2aaSSasha Levin }
4783c29e2aaSSasha Levin 
4794346fd8fSSasha Levin static struct kvm *kvm_cmd_run_init(int argc, const char **argv)
480f967c427SPrasad Joshi {
4812d96f6b6SSasha Levin 	static char real_cmdline[2048], default_name[20];
482384922b3SPekka Enberg 	unsigned int nr_online_cpus;
4834346fd8fSSasha Levin 	struct kvm *kvm = kvm__new();
48447621338SSasha Levin 
48547621338SSasha Levin 	if (IS_ERR(kvm))
4864346fd8fSSasha Levin 		return kvm;
487f967c427SPrasad Joshi 
488cfd63bbbSSasha Levin 	nr_online_cpus = sysconf(_SC_NPROCESSORS_ONLN);
48947621338SSasha Levin 	kvm->cfg.custom_rootfs_name = "default";
490cfd63bbbSSasha Levin 
491f967c427SPrasad Joshi 	while (argc != 0) {
4923b55dcdeSSasha Levin 		BUILD_OPTIONS(options, &kvm->cfg, kvm);
493f967c427SPrasad Joshi 		argc = parse_options(argc, argv, options, run_usage,
4941a007c82SSasha Levin 				PARSE_OPT_STOP_AT_NON_OPTION |
4951a007c82SSasha Levin 				PARSE_OPT_KEEP_DASHDASH);
496f967c427SPrasad Joshi 		if (argc != 0) {
4971a007c82SSasha Levin 			/* Cusrom options, should have been handled elsewhere */
4983c29e2aaSSasha Levin 			if (strcmp(argv[0], "--") == 0) {
4993c29e2aaSSasha Levin 				if (kvm_run_wrapper == KVM_RUN_SANDBOX) {
50047621338SSasha Levin 					kvm->cfg.sandbox = DEFAULT_SANDBOX_FILENAME;
5014346fd8fSSasha Levin 					kvm_run_write_sandbox_cmd(kvm, argv+1, argc-1);
5021a007c82SSasha Levin 					break;
5033c29e2aaSSasha Levin 				}
5043c29e2aaSSasha Levin 			}
5051a007c82SSasha Levin 
50647621338SSasha Levin 			if ((kvm_run_wrapper == KVM_RUN_DEFAULT && kvm->cfg.kernel_filename) ||
50747621338SSasha Levin 				(kvm_run_wrapper == KVM_RUN_SANDBOX && kvm->cfg.sandbox)) {
508f967c427SPrasad Joshi 				fprintf(stderr, "Cannot handle parameter: "
509f967c427SPrasad Joshi 						"%s\n", argv[0]);
510f967c427SPrasad Joshi 				usage_with_options(run_usage, options);
51147621338SSasha Levin 				free(kvm);
5124346fd8fSSasha Levin 				return ERR_PTR(-EINVAL);
513f967c427SPrasad Joshi 			}
514e0747665SSasha Levin 			if (kvm_run_wrapper == KVM_RUN_SANDBOX) {
515e0747665SSasha Levin 				/*
516e0747665SSasha Levin 				 * first unhandled parameter is treated as
517e0747665SSasha Levin 				 * sandbox command
518e0747665SSasha Levin 				 */
51947621338SSasha Levin 				kvm->cfg.sandbox = DEFAULT_SANDBOX_FILENAME;
5204346fd8fSSasha Levin 				kvm_run_write_sandbox_cmd(kvm, argv, argc);
521e0747665SSasha Levin 			} else {
522e0747665SSasha Levin 				/*
523e0747665SSasha Levin 				 * first unhandled parameter is treated as a kernel
524e0747665SSasha Levin 				 * image
525f967c427SPrasad Joshi 				 */
52647621338SSasha Levin 				kvm->cfg.kernel_filename = argv[0];
527e0747665SSasha Levin 			}
528f967c427SPrasad Joshi 			argv++;
529f967c427SPrasad Joshi 			argc--;
530f967c427SPrasad Joshi 		}
531f967c427SPrasad Joshi 
532f967c427SPrasad Joshi 	}
533f967c427SPrasad Joshi 
5343b55dcdeSSasha Levin 	kvm->nr_disks = kvm->cfg.image_count;
5353b55dcdeSSasha Levin 
53647621338SSasha Levin 	if (!kvm->cfg.kernel_filename)
53747621338SSasha Levin 		kvm->cfg.kernel_filename = find_kernel();
5388329f30bSPekka Enberg 
53947621338SSasha Levin 	if (!kvm->cfg.kernel_filename) {
540e08c0896SPrasad Joshi 		kernel_usage_with_options();
5414346fd8fSSasha Levin 		return ERR_PTR(-EINVAL);
5428329f30bSPekka Enberg 	}
5438329f30bSPekka Enberg 
54447621338SSasha Levin 	kvm->cfg.vmlinux_filename = find_vmlinux();
545084a1356SSasha Levin 	kvm->vmlinux = kvm->cfg.vmlinux_filename;
546b0b42ba0SPekka Enberg 
54700ebbe96SSasha Levin 	if (kvm->cfg.nrcpus == 0)
54800ebbe96SSasha Levin 		kvm->cfg.nrcpus = nr_online_cpus;
549d77a9efaSCyrill Gorcunov 
55047621338SSasha Levin 	if (!kvm->cfg.ram_size)
55100ebbe96SSasha Levin 		kvm->cfg.ram_size = get_ram_size(kvm->cfg.nrcpus);
552fd834defSPekka Enberg 
55347621338SSasha Levin 	if (kvm->cfg.ram_size > host_ram_size())
554*69f50425SAndreas Herrmann 		pr_warning("Guest memory size %lluMB exceeds host physical RAM size %lluMB",
555*69f50425SAndreas Herrmann 			(unsigned long long)kvm->cfg.ram_size,
556*69f50425SAndreas Herrmann 			(unsigned long long)host_ram_size());
55760ded003SPekka Enberg 
55847621338SSasha Levin 	kvm->cfg.ram_size <<= MB_SHIFT;
559f967c427SPrasad Joshi 
56047621338SSasha Levin 	if (!kvm->cfg.dev)
56147621338SSasha Levin 		kvm->cfg.dev = DEFAULT_KVM_DEV;
562f967c427SPrasad Joshi 
56347621338SSasha Levin 	if (!kvm->cfg.console)
56447621338SSasha Levin 		kvm->cfg.console = DEFAULT_CONSOLE;
5659aa4a0ebSAsias He 
56647621338SSasha Levin 	if (!strncmp(kvm->cfg.console, "virtio", 6))
5672651ea58SSasha Levin 		kvm->cfg.active_console  = CONSOLE_VIRTIO;
56847621338SSasha Levin 	else if (!strncmp(kvm->cfg.console, "serial", 6))
5692651ea58SSasha Levin 		kvm->cfg.active_console  = CONSOLE_8250;
57047621338SSasha Levin 	else if (!strncmp(kvm->cfg.console, "hv", 2))
5712651ea58SSasha Levin 		kvm->cfg.active_console = CONSOLE_HV;
5723bbc49b6SMatt Evans 	else
5733bbc49b6SMatt Evans 		pr_warning("No console!");
574f967c427SPrasad Joshi 
57547621338SSasha Levin 	if (!kvm->cfg.host_ip)
57647621338SSasha Levin 		kvm->cfg.host_ip = DEFAULT_HOST_ADDR;
5774d67c820SSasha Levin 
57847621338SSasha Levin 	if (!kvm->cfg.guest_ip)
57947621338SSasha Levin 		kvm->cfg.guest_ip = DEFAULT_GUEST_ADDR;
580bb8ffd2fSAsias He 
58147621338SSasha Levin 	if (!kvm->cfg.guest_mac)
58247621338SSasha Levin 		kvm->cfg.guest_mac = DEFAULT_GUEST_MAC;
583a4e724ddSSasha Levin 
58447621338SSasha Levin 	if (!kvm->cfg.host_mac)
58547621338SSasha Levin 		kvm->cfg.host_mac = DEFAULT_HOST_MAC;
586d7098b9bSAsias He 
58747621338SSasha Levin 	if (!kvm->cfg.script)
58847621338SSasha Levin 		kvm->cfg.script = DEFAULT_SCRIPT;
58973b7d038SAmos Kong 
590cf5323a3SSasha Levin 	if (!kvm->cfg.network)
591cf5323a3SSasha Levin                 kvm->cfg.network = DEFAULT_NETWORK;
592cf5323a3SSasha Levin 
593084a1356SSasha Levin 	memset(real_cmdline, 0, sizeof(real_cmdline));
5947bcceb95SPekka Enberg 	kvm__arch_set_cmdline(real_cmdline, kvm->cfg.vnc || kvm->cfg.sdl || kvm->cfg.gtk);
595084a1356SSasha Levin 
596084a1356SSasha Levin 	if (strlen(real_cmdline) > 0)
597084a1356SSasha Levin 		strcat(real_cmdline, " ");
598084a1356SSasha Levin 
599084a1356SSasha Levin 	if (kvm->cfg.kernel_cmdline)
600084a1356SSasha Levin 		strlcat(real_cmdline, kvm->cfg.kernel_cmdline, sizeof(real_cmdline));
601f967c427SPrasad Joshi 
60247621338SSasha Levin 	if (!kvm->cfg.guest_name) {
60347621338SSasha Levin 		if (kvm->cfg.custom_rootfs) {
60447621338SSasha Levin 			kvm->cfg.guest_name = kvm->cfg.custom_rootfs_name;
605587a4d17SLai Jiangshan 		} else {
6062d96f6b6SSasha Levin 			sprintf(default_name, "guest-%u", getpid());
60747621338SSasha Levin 			kvm->cfg.guest_name = default_name;
6082d96f6b6SSasha Levin 		}
609587a4d17SLai Jiangshan 	}
6102d96f6b6SSasha Levin 
61147621338SSasha Levin 	if (!kvm->cfg.using_rootfs && !kvm->cfg.disk_image[0].filename && !kvm->cfg.initrd_filename) {
612c8675741SSasha Levin 		char tmp[PATH_MAX];
6136df1471eSPekka Enberg 
61447621338SSasha Levin 		kvm_setup_create_new(kvm->cfg.custom_rootfs_name);
61547621338SSasha Levin 		kvm_setup_resolv(kvm->cfg.custom_rootfs_name);
616c8675741SSasha Levin 
6179667701cSPekka Enberg 		snprintf(tmp, PATH_MAX, "%s%s", kvm__get_dir(), "default");
618c8675741SSasha Levin 		if (virtio_9p__register(kvm, tmp, "/dev/root") < 0)
619c8675741SSasha Levin 			die("Unable to initialize virtio 9p");
620c8675741SSasha Levin 		if (virtio_9p__register(kvm, "/", "hostfs") < 0)
621c8675741SSasha Levin 			die("Unable to initialize virtio 9p");
62247621338SSasha Levin 		kvm->cfg.using_rootfs = kvm->cfg.custom_rootfs = 1;
62326c853e4SPrasad Joshi 	}
62426c853e4SPrasad Joshi 
62547621338SSasha Levin 	if (kvm->cfg.using_rootfs) {
626ff42603fSSasha Levin 		strcat(real_cmdline, " root=/dev/root rw rootflags=rw,trans=virtio,version=9p2000.L rootfstype=9p");
62747621338SSasha Levin 		if (kvm->cfg.custom_rootfs) {
6284346fd8fSSasha Levin 			kvm_run_set_sandbox(kvm);
629d50fe489SSasha Levin 
630a8e6b4b9SSasha Levin 			strcat(real_cmdline, " init=/virt/init");
631d50fe489SSasha Levin 
63247621338SSasha Levin 			if (!kvm->cfg.no_dhcp)
633a8e6b4b9SSasha Levin 				strcat(real_cmdline, "  ip=dhcp");
6344346fd8fSSasha Levin 			if (kvm_setup_guest_init(kvm))
635afc2c7c0SAsias He 				die("Failed to setup init for guest.");
636a8e6b4b9SSasha Levin 		}
63782d65b5eSSasha Levin 	} else if (!strstr(real_cmdline, "root=")) {
638ff42603fSSasha Levin 		strlcat(real_cmdline, " root=/dev/vda rw ", sizeof(real_cmdline));
63982d65b5eSSasha Levin 	}
64059aa2d30SSasha Levin 
641084a1356SSasha Levin 	kvm->cfg.real_cmdline = real_cmdline;
642084a1356SSasha Levin 
643084a1356SSasha Levin 	printf("  # %s run -k %s -m %Lu -c %d --name %s\n", KVM_BINARY_NAME,
644*69f50425SAndreas Herrmann 		kvm->cfg.kernel_filename,
645*69f50425SAndreas Herrmann 		(unsigned long long)kvm->cfg.ram_size / 1024 / 1024,
646*69f50425SAndreas Herrmann 		kvm->cfg.nrcpus, kvm->cfg.guest_name);
647084a1356SSasha Levin 
6485b403dbfSWill Deacon 	if (init_list__init(kvm) < 0)
6495b403dbfSWill Deacon 		die ("Initialisation failed");
6504346fd8fSSasha Levin 
6514346fd8fSSasha Levin 	return kvm;
652e1e46fe6SSasha Levin }
653e1e46fe6SSasha Levin 
6544346fd8fSSasha Levin static int kvm_cmd_run_work(struct kvm *kvm)
655e1e46fe6SSasha Levin {
656df4239fbSSasha Levin 	int i;
657e1e46fe6SSasha Levin 	void *ret = NULL;
658e1e46fe6SSasha Levin 
65900ebbe96SSasha Levin 	for (i = 0; i < kvm->nrcpus; i++) {
660df4239fbSSasha Levin 		if (pthread_create(&kvm->cpus[i]->thread, NULL, kvm_cpu_thread, kvm->cpus[i]) != 0)
6615ee154d1SPekka Enberg 			die("unable to create KVM VCPU thread");
6625ee154d1SPekka Enberg 	}
6635ee154d1SPekka Enberg 
66449e5227dSSasha Levin 	/* Only VCPU #0 is going to exit by itself when shutting down */
665df4239fbSSasha Levin 	return pthread_join(kvm->cpus[0]->thread, &ret);
666e1e46fe6SSasha Levin }
667e1e46fe6SSasha Levin 
/*
 * Tear down after the guest has stopped: print the collected compat
 * messages, run the exit list, and report a normal end of session when
 * 'guest_ret' is 0.
 */
static void kvm_cmd_run_exit(struct kvm *kvm, int guest_ret)
{
	compat__print_all_messages();

	init_list__exit(kvm);

	if (guest_ret != 0)
		return;

	printf("\n  # KVM session ended normally.\n");
}
677e1e46fe6SSasha Levin 
/*
 * Entry point of the run command: set up the VM from the command line, run
 * it, then tear it down.
 *
 * Returns the error encoded in the pointer when setup fails, otherwise the
 * value returned by kvm_cmd_run_work(). 'prefix' is not used.
 */
int kvm_cmd_run(int argc, const char **argv, const char *prefix)
{
	struct kvm *kvm = kvm_cmd_run_init(argc, argv);
	int status;

	if (IS_ERR(kvm))
		return PTR_ERR(kvm);

	status = kvm_cmd_run_work(kvm);
	kvm_cmd_run_exit(kvm, status);

	return status;
}
692