xref: /kvmtool/builtin-run.c (revision e342083c127d150f36289a0dbcfe153f15bbd73b)
1f967c427SPrasad Joshi #include <stdio.h>
2f967c427SPrasad Joshi #include <string.h>
3f967c427SPrasad Joshi #include <signal.h>
4f967c427SPrasad Joshi #include <unistd.h>
5f967c427SPrasad Joshi #include <stdlib.h>
6f967c427SPrasad Joshi #include <termios.h>
78329f30bSPekka Enberg #include <sys/utsname.h>
88329f30bSPekka Enberg #include <sys/types.h>
98329f30bSPekka Enberg #include <sys/stat.h>
1026c853e4SPrasad Joshi #include <ctype.h>
11f967c427SPrasad Joshi 
12f967c427SPrasad Joshi /* user defined header files */
13f967c427SPrasad Joshi #include <linux/types.h>
14f967c427SPrasad Joshi #include <kvm/kvm.h>
155c3d55faSPekka Enberg #include <kvm/kvm-cpu.h>
16f967c427SPrasad Joshi #include <kvm/8250-serial.h>
17f967c427SPrasad Joshi #include <kvm/virtio-blk.h>
184f56d42cSAsias He #include <kvm/virtio-net.h>
19f967c427SPrasad Joshi #include <kvm/virtio-console.h>
2053eca082SSasha Levin #include <kvm/virtio-rng.h>
21f967c427SPrasad Joshi #include <kvm/disk-image.h>
22f967c427SPrasad Joshi #include <kvm/util.h>
23f967c427SPrasad Joshi #include <kvm/pci.h>
2464136c1cSPekka Enberg #include <kvm/rtc.h>
25f967c427SPrasad Joshi #include <kvm/term.h>
26ac38f433SPekka Enberg #include <kvm/ioport.h>
27d60bafe5SSasha Levin #include <kvm/threadpool.h>
28cffeab25SIngo Molnar #include <kvm/barrier.h>
29b0b42ba0SPekka Enberg #include <kvm/symbol.h>
301c7850f9SSasha Levin #include <kvm/virtio-9p.h>
315ffd4178SJohn Floren #include <kvm/vesa.h>
3237f3d50eSSasha Levin #include <kvm/ioeventfd.h>
33*e342083cSJohn Floren #include <kvm/i8042.h>
34f967c427SPrasad Joshi 
35f967c427SPrasad Joshi /* header files for gitish interface  */
36f967c427SPrasad Joshi #include <kvm/kvm-run.h>
37f967c427SPrasad Joshi #include <kvm/parse-options.h>
38b5b501ccSIngo Molnar #include <kvm/mutex.h>
39f967c427SPrasad Joshi 
/* Fallback values used by kvm_cmd_run() when an option is not supplied. */
#define DEFAULT_KVM_DEV		"/dev/kvm"
#define DEFAULT_CONSOLE		"serial"
#define DEFAULT_NETWORK		"virtio"
#define DEFAULT_HOST_ADDR	"192.168.33.2"
#define DEFAULT_GUEST_MAC	"00:11:22:33:44:55"
#define DEFAULT_SCRIPT		"none"

/*
 * Guest memory is configured in MiB; shifting by MB_SHIFT converts a MiB
 * count into bytes.
 */
#define MB_SHIFT		(20)
#define MIN_RAM_SIZE_MB		(64ULL)
#define MIN_RAM_SIZE_BYTE	(MIN_RAM_SIZE_MB << MB_SHIFT)
50f967c427SPrasad Joshi 
514298ddadSSasha Levin struct kvm *kvm;
524298ddadSSasha Levin struct kvm_cpu *kvm_cpus[KVM_NR_CPUS];
53656be1b8SSasha Levin __thread struct kvm_cpu *current_kvm_cpu;
54f967c427SPrasad Joshi 
55fd834defSPekka Enberg static u64 ram_size;
56a33979d8SSasha Levin static u8  image_count;
5780ac1d05SSasha Levin static int virtio_rng;
58f967c427SPrasad Joshi static const char *kernel_cmdline;
59f967c427SPrasad Joshi static const char *kernel_filename;
60b0b42ba0SPekka Enberg static const char *vmlinux_filename;
61f967c427SPrasad Joshi static const char *initrd_filename;
62a33979d8SSasha Levin static const char *image_filename[MAX_DISK_IMAGES];
639aa4a0ebSAsias He static const char *console;
64f967c427SPrasad Joshi static const char *kvm_dev;
654f56d42cSAsias He static const char *network;
664d67c820SSasha Levin static const char *host_ip_addr;
67a4e724ddSSasha Levin static const char *guest_mac;
6873b7d038SAmos Kong static const char *script;
691c7850f9SSasha Levin static const char *virtio_9p_dir;
700ea58e5bSPekka Enberg static bool single_step;
71a33979d8SSasha Levin static bool readonly_image[MAX_DISK_IMAGES];
725ffd4178SJohn Floren static bool vnc;
73f967c427SPrasad Joshi extern bool ioport_debug;
74f967c427SPrasad Joshi extern int  active_console;
75f967c427SPrasad Joshi 
76ed036f03SCyrill Gorcunov bool do_debug_print = false;
77ed036f03SCyrill Gorcunov 
78cfd63bbbSSasha Levin static int nrcpus;
79d77a9efaSCyrill Gorcunov 
80f967c427SPrasad Joshi static const char * const run_usage[] = {
818329f30bSPekka Enberg 	"kvm run [<options>] [<kernel image>]",
82f967c427SPrasad Joshi 	NULL
83f967c427SPrasad Joshi };
84f967c427SPrasad Joshi 
85a33979d8SSasha Levin static int img_name_parser(const struct option *opt, const char *arg, int unset)
86a33979d8SSasha Levin {
87a33979d8SSasha Levin 	char *sep;
88a33979d8SSasha Levin 
89a33979d8SSasha Levin 	if (image_count >= MAX_DISK_IMAGES)
90a33979d8SSasha Levin 		die("Currently only 4 images are supported");
91a33979d8SSasha Levin 
92a33979d8SSasha Levin 	image_filename[image_count] = arg;
93a33979d8SSasha Levin 	sep = strstr(arg, ",");
94a33979d8SSasha Levin 	if (sep) {
95a33979d8SSasha Levin 		if (strcmp(sep + 1, "ro") == 0)
96a33979d8SSasha Levin 			readonly_image[image_count] = 1;
97a33979d8SSasha Levin 		*sep = 0;
98a33979d8SSasha Levin 	}
99a33979d8SSasha Levin 
100a33979d8SSasha Levin 	image_count++;
101a33979d8SSasha Levin 
102a33979d8SSasha Levin 	return 0;
103a33979d8SSasha Levin }
104a33979d8SSasha Levin 
105f967c427SPrasad Joshi static const struct option options[] = {
1065e3af62dSSasha Levin 	OPT_GROUP("Basic options:"),
10780b1f72fSPekka Enberg 	OPT_INTEGER('c', "cpus", &nrcpus, "Number of CPUs"),
108f967c427SPrasad Joshi 	OPT_U64('m', "mem", &ram_size, "Virtual machine memory size in MiB."),
109d6c19027SAsias He 	OPT_CALLBACK('d', "disk", NULL, "image", "Disk image", img_name_parser),
11080b1f72fSPekka Enberg 	OPT_STRING('\0', "console", &console, "serial or virtio",
1115e3af62dSSasha Levin 			"Console to use"),
11280ac1d05SSasha Levin 	OPT_INCR('\0', "rng", &virtio_rng,
11353eca082SSasha Levin 			"Enable virtio Random Number Generator"),
114d6c19027SAsias He 	OPT_STRING('\0', "kvm-dev", &kvm_dev, "kvm-dev", "KVM device file"),
1151c7850f9SSasha Levin 	OPT_STRING('\0', "virtio-9p", &virtio_9p_dir, "root dir",
1161c7850f9SSasha Levin 			"Enable 9p over virtio"),
1175ffd4178SJohn Floren 	OPT_BOOLEAN('\0', "vnc", &vnc, "Enable VNC framebuffer"),
1185e3af62dSSasha Levin 
1195e3af62dSSasha Levin 	OPT_GROUP("Kernel options:"),
1205e3af62dSSasha Levin 	OPT_STRING('k', "kernel", &kernel_filename, "kernel",
1215e3af62dSSasha Levin 			"Kernel to boot in virtual machine"),
122d6c19027SAsias He 	OPT_STRING('i', "initrd", &initrd_filename, "initrd",
1235e3af62dSSasha Levin 			"Initial RAM disk image"),
1245e3af62dSSasha Levin 	OPT_STRING('p', "params", &kernel_cmdline, "params",
1255e3af62dSSasha Levin 			"Kernel command line arguments"),
1265e3af62dSSasha Levin 
1274d67c820SSasha Levin 	OPT_GROUP("Networking options:"),
1284d67c820SSasha Levin 	OPT_STRING('n', "network", &network, "virtio",
1294d67c820SSasha Levin 			"Network to use"),
1304d67c820SSasha Levin 	OPT_STRING('\0', "host-ip-addr", &host_ip_addr, "a.b.c.d",
1314d67c820SSasha Levin 			"Assign this address to the host side networking"),
132a4e724ddSSasha Levin 	OPT_STRING('\0', "guest-mac", &guest_mac, "aa:bb:cc:dd:ee:ff",
133a4e724ddSSasha Levin 			"Assign this address to the guest side NIC"),
13473b7d038SAmos Kong 	OPT_STRING('\0', "tapscript", &script, "Script path",
13573b7d038SAmos Kong 			 "Assign a script to process created tap device"),
136d6c19027SAsias He 
1375e3af62dSSasha Levin 	OPT_GROUP("Debug options:"),
138ed036f03SCyrill Gorcunov 	OPT_BOOLEAN('\0', "debug", &do_debug_print,
139ed036f03SCyrill Gorcunov 			"Enable debug messages"),
140d6c19027SAsias He 	OPT_BOOLEAN('\0', "debug-single-step", &single_step,
141d6c19027SAsias He 			"Enable single stepping"),
142d6c19027SAsias He 	OPT_BOOLEAN('\0', "debug-ioport-debug", &ioport_debug,
143d6c19027SAsias He 			"Enable ioport debugging"),
144f967c427SPrasad Joshi 	OPT_END()
145f967c427SPrasad Joshi };
146f967c427SPrasad Joshi 
147b5b501ccSIngo Molnar /*
148b5b501ccSIngo Molnar  * Serialize debug printout so that the output of multiple vcpus does not
149b5b501ccSIngo Molnar  * get mixed up:
150b5b501ccSIngo Molnar  */
151cffeab25SIngo Molnar static int printout_done;
152b5b501ccSIngo Molnar 
15343119af7SPekka Enberg static void handle_sigusr1(int sig)
15443119af7SPekka Enberg {
15543119af7SPekka Enberg 	struct kvm_cpu *cpu = current_kvm_cpu;
15643119af7SPekka Enberg 
15743119af7SPekka Enberg 	if (!cpu)
15843119af7SPekka Enberg 		return;
15943119af7SPekka Enberg 
160b5b501ccSIngo Molnar 	printf("\n #\n # vCPU #%ld's dump:\n #\n", cpu->cpu_id);
16143119af7SPekka Enberg 	kvm_cpu__show_registers(cpu);
16243119af7SPekka Enberg 	kvm_cpu__show_code(cpu);
16343119af7SPekka Enberg 	kvm_cpu__show_page_tables(cpu);
164b5b501ccSIngo Molnar 	fflush(stdout);
165cffeab25SIngo Molnar 	printout_done = 1;
166cffeab25SIngo Molnar 	mb();
16743119af7SPekka Enberg }
16843119af7SPekka Enberg 
/* Non-zero while the guest is paused; toggled by each SIGUSR2. */
static int is_paused;

/*
 * SIGUSR2 handler: pause a running guest or resume a paused one, then log
 * the new state.
 */
static void handle_sigusr2(int sig)
{
	if (!is_paused) {
		kvm__pause();
		is_paused = 1;
	} else {
		kvm__continue();
		is_paused = 0;
	}

	pr_info("Guest %s\n", is_paused ? "paused" : "resumed");
}
182d94e22b9SSasha Levin 
1839e854d1aSPekka Enberg static void handle_sigquit(int sig)
1849e854d1aSPekka Enberg {
1859e854d1aSPekka Enberg 	int i;
1869e854d1aSPekka Enberg 
1879e854d1aSPekka Enberg 	for (i = 0; i < nrcpus; i++) {
1889e854d1aSPekka Enberg 		struct kvm_cpu *cpu = kvm_cpus[i];
1899e854d1aSPekka Enberg 
19043119af7SPekka Enberg 		if (!cpu)
19143119af7SPekka Enberg 			continue;
19243119af7SPekka Enberg 
193cffeab25SIngo Molnar 		printout_done = 0;
19443119af7SPekka Enberg 		pthread_kill(cpu->thread, SIGUSR1);
195cffeab25SIngo Molnar 		/*
196cffeab25SIngo Molnar 		 * Wait for the vCPU to dump state before signalling
197cffeab25SIngo Molnar 		 * the next thread. Since this is debug code it does
198cffeab25SIngo Molnar 		 * not matter that we are burning CPU time a bit:
199cffeab25SIngo Molnar 		 */
200cffeab25SIngo Molnar 		while (!printout_done)
201cffeab25SIngo Molnar 			mb();
2029e854d1aSPekka Enberg 	}
2039e854d1aSPekka Enberg 
2049e854d1aSPekka Enberg 	serial8250__inject_sysrq(kvm);
2059e854d1aSPekka Enberg }
2069e854d1aSPekka Enberg 
2079e854d1aSPekka Enberg static void handle_sigalrm(int sig)
2089e854d1aSPekka Enberg {
2099e854d1aSPekka Enberg 	serial8250__inject_interrupt(kvm);
2109e854d1aSPekka Enberg 	virtio_console__inject_interrupt(kvm);
2119e854d1aSPekka Enberg }
2129e854d1aSPekka Enberg 
2135ee154d1SPekka Enberg static void *kvm_cpu_thread(void *arg)
2145ee154d1SPekka Enberg {
215d77a9efaSCyrill Gorcunov 	current_kvm_cpu		= arg;
2165ee154d1SPekka Enberg 
217d77a9efaSCyrill Gorcunov 	if (kvm_cpu__start(current_kvm_cpu))
2185ee154d1SPekka Enberg 		goto panic_kvm;
2195ee154d1SPekka Enberg 
220d77a9efaSCyrill Gorcunov 	kvm_cpu__delete(current_kvm_cpu);
2215ee154d1SPekka Enberg 
2225ee154d1SPekka Enberg 	return (void *) (intptr_t) 0;
2235ee154d1SPekka Enberg 
2245ee154d1SPekka Enberg panic_kvm:
2253fdf659dSSasha Levin 	fprintf(stderr, "KVM exit reason: %u (\"%s\")\n",
226d77a9efaSCyrill Gorcunov 		current_kvm_cpu->kvm_run->exit_reason,
227d77a9efaSCyrill Gorcunov 		kvm_exit_reasons[current_kvm_cpu->kvm_run->exit_reason]);
228d77a9efaSCyrill Gorcunov 	if (current_kvm_cpu->kvm_run->exit_reason == KVM_EXIT_UNKNOWN)
2295ee154d1SPekka Enberg 		fprintf(stderr, "KVM exit code: 0x%Lu\n",
230d77a9efaSCyrill Gorcunov 			current_kvm_cpu->kvm_run->hw.hardware_exit_reason);
2318e5accedSPekka Enberg 
232d77a9efaSCyrill Gorcunov 	kvm_cpu__show_registers(current_kvm_cpu);
233d77a9efaSCyrill Gorcunov 	kvm_cpu__show_code(current_kvm_cpu);
234d77a9efaSCyrill Gorcunov 	kvm_cpu__show_page_tables(current_kvm_cpu);
2355ee154d1SPekka Enberg 
236d77a9efaSCyrill Gorcunov 	kvm_cpu__delete(current_kvm_cpu);
2375ee154d1SPekka Enberg 
2385ee154d1SPekka Enberg 	return (void *) (intptr_t) 1;
2395ee154d1SPekka Enberg }
2405ee154d1SPekka Enberg 
241e08c0896SPrasad Joshi static char kernel[PATH_MAX];
242b0b42ba0SPekka Enberg 
243b0b42ba0SPekka Enberg static const char *host_kernels[] = {
244e08c0896SPrasad Joshi 	"/boot/vmlinuz",
245e08c0896SPrasad Joshi 	"/boot/bzImage",
246e08c0896SPrasad Joshi 	NULL
247e08c0896SPrasad Joshi };
248b0b42ba0SPekka Enberg 
249b0b42ba0SPekka Enberg static const char *default_kernels[] = {
250e08c0896SPrasad Joshi 	"./bzImage",
251e08c0896SPrasad Joshi 	"../../arch/x86/boot/bzImage",
252e08c0896SPrasad Joshi 	NULL
253e08c0896SPrasad Joshi };
2548329f30bSPekka Enberg 
255b0b42ba0SPekka Enberg static const char *default_vmlinux[] = {
256b0b42ba0SPekka Enberg 	"../../../vmlinux",
257b0b42ba0SPekka Enberg 	"../../vmlinux",
258b0b42ba0SPekka Enberg 	NULL
259b0b42ba0SPekka Enberg };
260b0b42ba0SPekka Enberg 
261e08c0896SPrasad Joshi static void kernel_usage_with_options(void)
2628329f30bSPekka Enberg {
263e08c0896SPrasad Joshi 	const char **k;
2648329f30bSPekka Enberg 	struct utsname uts;
265e08c0896SPrasad Joshi 
266e08c0896SPrasad Joshi 	fprintf(stderr, "Fatal: could not find default kernel image in:\n");
26765182f37SPrasad Joshi 	k = &default_kernels[0];
268e08c0896SPrasad Joshi 	while (*k) {
269e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", *k);
270e08c0896SPrasad Joshi 		k++;
271e08c0896SPrasad Joshi 	}
272e08c0896SPrasad Joshi 
273e08c0896SPrasad Joshi 	if (uname(&uts) < 0)
274e08c0896SPrasad Joshi 		return;
275e08c0896SPrasad Joshi 
276e08c0896SPrasad Joshi 	k = &host_kernels[0];
277e08c0896SPrasad Joshi 	while (*k) {
278e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
279e08c0896SPrasad Joshi 			return;
280e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", kernel);
281e08c0896SPrasad Joshi 		k++;
282e08c0896SPrasad Joshi 	}
283a33389d8SPrasad Joshi 	fprintf(stderr, "\nPlease see 'kvm run --help' for more options.\n\n");
284e08c0896SPrasad Joshi }
285e08c0896SPrasad Joshi 
28660ded003SPekka Enberg static u64 host_ram_size(void)
28760ded003SPekka Enberg {
28860ded003SPekka Enberg 	long page_size;
28960ded003SPekka Enberg 	long nr_pages;
29060ded003SPekka Enberg 
29160ded003SPekka Enberg 	nr_pages	= sysconf(_SC_PHYS_PAGES);
292d63c5ce6SPekka Enberg 	if (nr_pages < 0) {
2934542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PHYS_PAGES) failed");
294d63c5ce6SPekka Enberg 		return 0;
295d63c5ce6SPekka Enberg 	}
29660ded003SPekka Enberg 
29760ded003SPekka Enberg 	page_size	= sysconf(_SC_PAGE_SIZE);
298d63c5ce6SPekka Enberg 	if (page_size < 0) {
2994542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PAGE_SIZE) failed");
300d63c5ce6SPekka Enberg 		return 0;
301d63c5ce6SPekka Enberg 	}
30260ded003SPekka Enberg 
30360ded003SPekka Enberg 	return (nr_pages * page_size) >> MB_SHIFT;
30460ded003SPekka Enberg }
30560ded003SPekka Enberg 
30618bd8c3bSPekka Enberg /*
30718bd8c3bSPekka Enberg  * If user didn't specify how much memory it wants to allocate for the guest,
30818bd8c3bSPekka Enberg  * avoid filling the whole host RAM.
30918bd8c3bSPekka Enberg  */
31018bd8c3bSPekka Enberg #define RAM_SIZE_RATIO		0.8
31118bd8c3bSPekka Enberg 
312fd834defSPekka Enberg static u64 get_ram_size(int nr_cpus)
313fd834defSPekka Enberg {
314fd834defSPekka Enberg 	long available;
315fd834defSPekka Enberg 	long ram_size;
316fd834defSPekka Enberg 
317fd834defSPekka Enberg 	ram_size	= 64 * (nr_cpus + 3);
318fd834defSPekka Enberg 
31960ded003SPekka Enberg 	available	= host_ram_size() * RAM_SIZE_RATIO;
320d63c5ce6SPekka Enberg 	if (!available)
321d63c5ce6SPekka Enberg 		available = MIN_RAM_SIZE_MB;
322fd834defSPekka Enberg 
323fd834defSPekka Enberg 	if (ram_size > available)
324fd834defSPekka Enberg 		ram_size	= available;
325fd834defSPekka Enberg 
326fd834defSPekka Enberg 	return ram_size;
327fd834defSPekka Enberg }
328fd834defSPekka Enberg 
329e08c0896SPrasad Joshi static const char *find_kernel(void)
330e08c0896SPrasad Joshi {
331e08c0896SPrasad Joshi 	const char **k;
3328329f30bSPekka Enberg 	struct stat st;
333e08c0896SPrasad Joshi 	struct utsname uts;
334e08c0896SPrasad Joshi 
33565182f37SPrasad Joshi 	k = &default_kernels[0];
336e08c0896SPrasad Joshi 	while (*k) {
337e08c0896SPrasad Joshi 		if (stat(*k, &st) < 0 || !S_ISREG(st.st_mode)) {
338e08c0896SPrasad Joshi 			k++;
339e08c0896SPrasad Joshi 			continue;
340e08c0896SPrasad Joshi 		}
341e08c0896SPrasad Joshi 		strncpy(kernel, *k, PATH_MAX);
342e08c0896SPrasad Joshi 		return kernel;
343e08c0896SPrasad Joshi 	}
3448329f30bSPekka Enberg 
3458329f30bSPekka Enberg 	if (uname(&uts) < 0)
3468329f30bSPekka Enberg 		return NULL;
3478329f30bSPekka Enberg 
348e08c0896SPrasad Joshi 	k = &host_kernels[0];
349e08c0896SPrasad Joshi 	while (*k) {
350e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
3518329f30bSPekka Enberg 			return NULL;
3528329f30bSPekka Enberg 
353e08c0896SPrasad Joshi 		if (stat(kernel, &st) < 0 || !S_ISREG(st.st_mode)) {
354e08c0896SPrasad Joshi 			k++;
355e08c0896SPrasad Joshi 			continue;
356e08c0896SPrasad Joshi 		}
357e08c0896SPrasad Joshi 		return kernel;
3588329f30bSPekka Enberg 
359e08c0896SPrasad Joshi 	}
3608329f30bSPekka Enberg 	return NULL;
3618329f30bSPekka Enberg }
3628329f30bSPekka Enberg 
363b0b42ba0SPekka Enberg static const char *find_vmlinux(void)
364b0b42ba0SPekka Enberg {
365b0b42ba0SPekka Enberg 	const char **vmlinux;
366b0b42ba0SPekka Enberg 
367b0b42ba0SPekka Enberg 	vmlinux = &default_vmlinux[0];
368b0b42ba0SPekka Enberg 	while (*vmlinux) {
369b0b42ba0SPekka Enberg 		struct stat st;
370b0b42ba0SPekka Enberg 
371b0b42ba0SPekka Enberg 		if (stat(*vmlinux, &st) < 0 || !S_ISREG(st.st_mode)) {
372b0b42ba0SPekka Enberg 			vmlinux++;
373b0b42ba0SPekka Enberg 			continue;
374b0b42ba0SPekka Enberg 		}
375b0b42ba0SPekka Enberg 		return *vmlinux;
376b0b42ba0SPekka Enberg 	}
377b0b42ba0SPekka Enberg 	return NULL;
378b0b42ba0SPekka Enberg }
379b0b42ba0SPekka Enberg 
/*
 * Describe the device backing the host's root file system.
 *
 * @dev:  output buffer that receives "/dev/block/<major>:0"; the caller must
 *        supply enough room, as no size is passed in.
 * @part: receives the minor number of the device holding "/".
 *
 * Returns 0 when the device node is readable, -1 when stat("/") fails or the
 * node cannot be read.
 */
static int root_device(char *dev, long *part)
{
	struct stat root_st;

	if (stat("/", &root_st) < 0)
		return -1;

	*part = minor(root_st.st_dev);
	sprintf(dev, "/dev/block/%u:0", major(root_st.st_dev));

	return access(dev, R_OK) < 0 ? -1 : 0;
}
39526c853e4SPrasad Joshi 
39626c853e4SPrasad Joshi static char *host_image(char *cmd_line, size_t size)
39726c853e4SPrasad Joshi {
39826c853e4SPrasad Joshi 	char *t;
39926c853e4SPrasad Joshi 	char device[PATH_MAX];
40026c853e4SPrasad Joshi 	long part = 0;
40126c853e4SPrasad Joshi 
40226c853e4SPrasad Joshi 	t = malloc(PATH_MAX);
40326c853e4SPrasad Joshi 	if (!t)
40426c853e4SPrasad Joshi 		return NULL;
40526c853e4SPrasad Joshi 
40626c853e4SPrasad Joshi 	/* check for the root file system */
40726c853e4SPrasad Joshi 	if (root_device(device, &part) < 0) {
40826c853e4SPrasad Joshi 		free(t);
40926c853e4SPrasad Joshi 		return NULL;
41026c853e4SPrasad Joshi 	}
41126c853e4SPrasad Joshi 	strncpy(t, device, PATH_MAX);
41226c853e4SPrasad Joshi 	if (!strstr(cmd_line, "root=")) {
41326c853e4SPrasad Joshi 		char tmp[PATH_MAX];
41426c853e4SPrasad Joshi 		snprintf(tmp, sizeof(tmp), "root=/dev/vda%ld rw ", part);
41526c853e4SPrasad Joshi 		strlcat(cmd_line, tmp, size);
41626c853e4SPrasad Joshi 	}
41726c853e4SPrasad Joshi 	return t;
41826c853e4SPrasad Joshi }
41926c853e4SPrasad Joshi 
420f6677a1dSAmerigo Wang void kvm_run_help(void)
421f6677a1dSAmerigo Wang {
422f6677a1dSAmerigo Wang 	usage_with_options(run_usage, options);
423f6677a1dSAmerigo Wang }
424f6677a1dSAmerigo Wang 
425f967c427SPrasad Joshi int kvm_cmd_run(int argc, const char **argv, const char *prefix)
426f967c427SPrasad Joshi {
427b0b42ba0SPekka Enberg 	struct virtio_net_parameters net_params;
428f967c427SPrasad Joshi 	static char real_cmdline[2048];
429384922b3SPekka Enberg 	unsigned int nr_online_cpus;
4305ee154d1SPekka Enberg 	int exit_code = 0;
431b0b42ba0SPekka Enberg 	int max_cpus;
43226c853e4SPrasad Joshi 	char *hi;
433b0b42ba0SPekka Enberg 	int i;
43449e5227dSSasha Levin 	void *ret;
4355ffd4178SJohn Floren 	u16 vidmode = 0;
436f967c427SPrasad Joshi 
4375ee154d1SPekka Enberg 	signal(SIGALRM, handle_sigalrm);
438f967c427SPrasad Joshi 	signal(SIGQUIT, handle_sigquit);
43943119af7SPekka Enberg 	signal(SIGUSR1, handle_sigusr1);
440d94e22b9SSasha Levin 	signal(SIGUSR2, handle_sigusr2);
441f967c427SPrasad Joshi 
442cfd63bbbSSasha Levin 	nr_online_cpus = sysconf(_SC_NPROCESSORS_ONLN);
443cfd63bbbSSasha Levin 
444f967c427SPrasad Joshi 	while (argc != 0) {
445f967c427SPrasad Joshi 		argc = parse_options(argc, argv, options, run_usage,
446f967c427SPrasad Joshi 				PARSE_OPT_STOP_AT_NON_OPTION);
447f967c427SPrasad Joshi 		if (argc != 0) {
448f967c427SPrasad Joshi 			if (kernel_filename) {
449f967c427SPrasad Joshi 				fprintf(stderr, "Cannot handle parameter: "
450f967c427SPrasad Joshi 						"%s\n", argv[0]);
451f967c427SPrasad Joshi 				usage_with_options(run_usage, options);
452f967c427SPrasad Joshi 				return EINVAL;
453f967c427SPrasad Joshi 			}
454f967c427SPrasad Joshi 			/* first unhandled parameter is treated as a kernel
455f967c427SPrasad Joshi 			   image
456f967c427SPrasad Joshi 			 */
457f967c427SPrasad Joshi 			kernel_filename = argv[0];
458f967c427SPrasad Joshi 			argv++;
459f967c427SPrasad Joshi 			argc--;
460f967c427SPrasad Joshi 		}
461f967c427SPrasad Joshi 
462f967c427SPrasad Joshi 	}
463f967c427SPrasad Joshi 
46445bc2f02SPekka Enberg 	if (!kernel_filename)
465e08c0896SPrasad Joshi 		kernel_filename = find_kernel();
4668329f30bSPekka Enberg 
4678329f30bSPekka Enberg 	if (!kernel_filename) {
468e08c0896SPrasad Joshi 		kernel_usage_with_options();
4698329f30bSPekka Enberg 		return EINVAL;
4708329f30bSPekka Enberg 	}
4718329f30bSPekka Enberg 
472b0b42ba0SPekka Enberg 	vmlinux_filename = find_vmlinux();
473b0b42ba0SPekka Enberg 
474cfd63bbbSSasha Levin 	if (nrcpus == 0)
475cfd63bbbSSasha Levin 		nrcpus = nr_online_cpus;
476cfd63bbbSSasha Levin 	else if (nrcpus < 1 || nrcpus > KVM_NR_CPUS)
477d77a9efaSCyrill Gorcunov 		die("Number of CPUs %d is out of [1;%d] range", nrcpus, KVM_NR_CPUS);
478d77a9efaSCyrill Gorcunov 
479fd834defSPekka Enberg 	if (!ram_size)
480fd834defSPekka Enberg 		ram_size	= get_ram_size(nrcpus);
481fd834defSPekka Enberg 
482a2a002f9SIngo Molnar 	if (ram_size < MIN_RAM_SIZE_MB)
483a2a002f9SIngo Molnar 		die("Not enough memory specified: %lluMB (min %lluMB)", ram_size, MIN_RAM_SIZE_MB);
484a2a002f9SIngo Molnar 
48560ded003SPekka Enberg 	if (ram_size > host_ram_size())
4864542f276SCyrill Gorcunov 		pr_warning("Guest memory size %lluMB exceeds host physical RAM size %lluMB", ram_size, host_ram_size());
48760ded003SPekka Enberg 
488f967c427SPrasad Joshi 	ram_size <<= MB_SHIFT;
489f967c427SPrasad Joshi 
490f967c427SPrasad Joshi 	if (!kvm_dev)
491f967c427SPrasad Joshi 		kvm_dev = DEFAULT_KVM_DEV;
492f967c427SPrasad Joshi 
4939aa4a0ebSAsias He 	if (!console)
4949aa4a0ebSAsias He 		console = DEFAULT_CONSOLE;
4959aa4a0ebSAsias He 
4969aa4a0ebSAsias He 	if (!strncmp(console, "virtio", 6))
497f967c427SPrasad Joshi 		active_console  = CONSOLE_VIRTIO;
4989aa4a0ebSAsias He 	else
4999aa4a0ebSAsias He 		active_console  = CONSOLE_8250;
500f967c427SPrasad Joshi 
5014d67c820SSasha Levin 	if (!host_ip_addr)
5024d67c820SSasha Levin 		host_ip_addr = DEFAULT_HOST_ADDR;
5034d67c820SSasha Levin 
504a4e724ddSSasha Levin 	if (!guest_mac)
505a4e724ddSSasha Levin 		guest_mac = DEFAULT_GUEST_MAC;
506a4e724ddSSasha Levin 
50773b7d038SAmos Kong 	if (!script)
50873b7d038SAmos Kong 		script = DEFAULT_SCRIPT;
50973b7d038SAmos Kong 
5101c7850f9SSasha Levin 	if (virtio_9p_dir) {
5111c7850f9SSasha Levin 		char tmp[PATH_MAX];
5121c7850f9SSasha Levin 
5131c7850f9SSasha Levin 		if (realpath(virtio_9p_dir, tmp))
5141c7850f9SSasha Levin 			virtio_9p__init(kvm, tmp);
5151c7850f9SSasha Levin 		else
5161c7850f9SSasha Levin 			die("Failed resolving 9p path");
5171c7850f9SSasha Levin 	}
5181c7850f9SSasha Levin 
519b0b42ba0SPekka Enberg 	symbol__init(vmlinux_filename);
520b0b42ba0SPekka Enberg 
521f967c427SPrasad Joshi 	term_init();
522f967c427SPrasad Joshi 
523f967c427SPrasad Joshi 	kvm = kvm__init(kvm_dev, ram_size);
524f967c427SPrasad Joshi 
52537f3d50eSSasha Levin 	ioeventfd__init();
52637f3d50eSSasha Levin 
527384922b3SPekka Enberg 	max_cpus = kvm__max_cpus(kvm);
528384922b3SPekka Enberg 
529384922b3SPekka Enberg 	if (nrcpus > max_cpus) {
530384922b3SPekka Enberg 		printf("  # Limit the number of CPUs to %d\n", max_cpus);
531384922b3SPekka Enberg 		kvm->nrcpus	= max_cpus;
532384922b3SPekka Enberg 	}
533384922b3SPekka Enberg 
5340c7c14a7SCyrill Gorcunov 	kvm->nrcpus = nrcpus;
5350c7c14a7SCyrill Gorcunov 
53626c853e4SPrasad Joshi 	memset(real_cmdline, 0, sizeof(real_cmdline));
5375ffd4178SJohn Floren 	strcpy(real_cmdline, "notsc noapic noacpi pci=conf1");
5385ffd4178SJohn Floren 	if (vnc) {
5395ffd4178SJohn Floren 		strcat(real_cmdline, " video=vesafb console=tty0");
5405ffd4178SJohn Floren 		vidmode = 0x312;
5415ffd4178SJohn Floren 	} else {
5425ffd4178SJohn Floren 		strcat(real_cmdline, " console=ttyS0 earlyprintk=serial");
5435ffd4178SJohn Floren 	}
544d74181ccSSasha Levin 	strcat(real_cmdline, " ");
54526c853e4SPrasad Joshi 	if (kernel_cmdline)
54626c853e4SPrasad Joshi 		strlcat(real_cmdline, kernel_cmdline, sizeof(real_cmdline));
54726c853e4SPrasad Joshi 
54826c853e4SPrasad Joshi 	hi = NULL;
549a33979d8SSasha Levin 	if (!image_filename[0]) {
55026c853e4SPrasad Joshi 		hi = host_image(real_cmdline, sizeof(real_cmdline));
55126c853e4SPrasad Joshi 		if (hi) {
552a33979d8SSasha Levin 			image_filename[0] = hi;
553a33979d8SSasha Levin 			readonly_image[0] = true;
55425bf86f6SSasha Levin 			image_count++;
55526c853e4SPrasad Joshi 		}
55626c853e4SPrasad Joshi 	}
55726c853e4SPrasad Joshi 
55826c853e4SPrasad Joshi 	if (!strstr(real_cmdline, "root="))
55926c853e4SPrasad Joshi 		strlcat(real_cmdline, " root=/dev/vda rw ", sizeof(real_cmdline));
56026c853e4SPrasad Joshi 
561c1ed214eSPrasad Joshi 	if (image_count) {
562bcb6aacaSPrasad Joshi 		kvm->nr_disks = image_count;
563c1ed214eSPrasad Joshi 		kvm->disks    = disk_image__open_all(image_filename, readonly_image, image_count);
564c1ed214eSPrasad Joshi 		if (!kvm->disks)
565c1ed214eSPrasad Joshi 			die("Unable to load all disk images.");
56638605e1cSSasha Levin 
567bcb6aacaSPrasad Joshi 		virtio_blk__init_all(kvm);
568f967c427SPrasad Joshi 	}
569c1ed214eSPrasad Joshi 
57026c853e4SPrasad Joshi 	free(hi);
571f967c427SPrasad Joshi 
5723780b3d5SPekka Enberg 	printf("  # kvm run -k %s -m %Lu -c %d\n", kernel_filename, ram_size / 1024 / 1024, nrcpus);
573471c6facSPekka Enberg 
574f967c427SPrasad Joshi 	if (!kvm__load_kernel(kvm, kernel_filename, initrd_filename,
5755ffd4178SJohn Floren 				real_cmdline, vidmode))
576f967c427SPrasad Joshi 		die("unable to load kernel %s", kernel_filename);
577f967c427SPrasad Joshi 
578b0b42ba0SPekka Enberg 	kvm->vmlinux		= vmlinux_filename;
579b0b42ba0SPekka Enberg 
580ac38f433SPekka Enberg 	ioport__setup_legacy();
581ac38f433SPekka Enberg 
58264136c1cSPekka Enberg 	rtc__init();
58364136c1cSPekka Enberg 
584f967c427SPrasad Joshi 	serial8250__init(kvm);
585f967c427SPrasad Joshi 
586f967c427SPrasad Joshi 	pci__init();
587f967c427SPrasad Joshi 
5881621292eSSasha Levin 	if (active_console == CONSOLE_VIRTIO)
589f967c427SPrasad Joshi 		virtio_console__init(kvm);
590f967c427SPrasad Joshi 
59153eca082SSasha Levin 	if (virtio_rng)
59280ac1d05SSasha Levin 		while (virtio_rng--)
59353eca082SSasha Levin 			virtio_rng__init(kvm);
59453eca082SSasha Levin 
5954f56d42cSAsias He 	if (!network)
5964f56d42cSAsias He 		network = DEFAULT_NETWORK;
5974f56d42cSAsias He 
598bdfcfca6SSasha Levin 	if (!strncmp(network, "virtio", 6)) {
599bdfcfca6SSasha Levin 		net_params = (struct virtio_net_parameters) {
600bdfcfca6SSasha Levin 			.host_ip = host_ip_addr,
60143835ac9SSasha Levin 			.kvm = kvm,
60273b7d038SAmos Kong 			.script = script
603bdfcfca6SSasha Levin 		};
604a4e724ddSSasha Levin 		sscanf(guest_mac,	"%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
605a4e724ddSSasha Levin 							net_params.guest_mac,
606a4e724ddSSasha Levin 							net_params.guest_mac+1,
607a4e724ddSSasha Levin 							net_params.guest_mac+2,
608a4e724ddSSasha Levin 							net_params.guest_mac+3,
609a4e724ddSSasha Levin 							net_params.guest_mac+4,
610a4e724ddSSasha Levin 							net_params.guest_mac+5);
611a4e724ddSSasha Levin 
612bdfcfca6SSasha Levin 		virtio_net__init(&net_params);
613bdfcfca6SSasha Levin 	}
6144f56d42cSAsias He 
615f967c427SPrasad Joshi 	kvm__start_timer(kvm);
616f967c427SPrasad Joshi 
6178ec7e042SSasha Levin 	kvm__setup_bios(kvm);
6188ec7e042SSasha Levin 
619d77a9efaSCyrill Gorcunov 	for (i = 0; i < nrcpus; i++) {
620d77a9efaSCyrill Gorcunov 		kvm_cpus[i] = kvm_cpu__init(kvm, i);
621d77a9efaSCyrill Gorcunov 		if (!kvm_cpus[i])
6225ee154d1SPekka Enberg 			die("unable to initialize KVM VCPU");
6235d1a249cSPekka Enberg 
6245ee154d1SPekka Enberg 		if (single_step)
625d77a9efaSCyrill Gorcunov 			kvm_cpu__enable_singlestep(kvm_cpus[i]);
626839051d9SSasha Levin 	}
6275ee154d1SPekka Enberg 
628839051d9SSasha Levin 	kvm__init_ram(kvm);
629839051d9SSasha Levin 
630*e342083cSJohn Floren 	if (vnc) {
631*e342083cSJohn Floren 		kbd__init(kvm);
6325ffd4178SJohn Floren 		vesa__init(kvm);
633*e342083cSJohn Floren 	}
6345ffd4178SJohn Floren 
635d60bafe5SSasha Levin 	thread_pool__init(nr_online_cpus);
63637f3d50eSSasha Levin 	ioeventfd__start();
637d60bafe5SSasha Levin 
638839051d9SSasha Levin 	for (i = 0; i < nrcpus; i++) {
639d77a9efaSCyrill Gorcunov 		if (pthread_create(&kvm_cpus[i]->thread, NULL, kvm_cpu_thread, kvm_cpus[i]) != 0)
6405ee154d1SPekka Enberg 			die("unable to create KVM VCPU thread");
6415ee154d1SPekka Enberg 	}
6425ee154d1SPekka Enberg 
64349e5227dSSasha Levin 	/* Only VCPU #0 is going to exit by itself when shutting down */
64449e5227dSSasha Levin 	if (pthread_join(kvm_cpus[0]->thread, &ret) != 0)
64549e5227dSSasha Levin 		exit_code = 1;
6465ee154d1SPekka Enberg 
64749e5227dSSasha Levin 	for (i = 1; i < nrcpus; i++) {
64849e5227dSSasha Levin 		pthread_kill(kvm_cpus[i]->thread, SIGKVMEXIT);
649d77a9efaSCyrill Gorcunov 		if (pthread_join(kvm_cpus[i]->thread, &ret) != 0)
6505ee154d1SPekka Enberg 			die("pthread_join");
6515ee154d1SPekka Enberg 
6525ee154d1SPekka Enberg 		if (ret != NULL)
6535ee154d1SPekka Enberg 			exit_code = 1;
6545ee154d1SPekka Enberg 	}
655f967c427SPrasad Joshi 
656a0a1e3c2SPrasad Joshi 	virtio_blk__delete_all(kvm);
65780ac1d05SSasha Levin 	virtio_rng__delete_all(kvm);
658a0a1e3c2SPrasad Joshi 
6599df47d00SPrasad Joshi 	disk_image__close_all(kvm->disks, image_count);
660f967c427SPrasad Joshi 	kvm__delete(kvm);
661f967c427SPrasad Joshi 
6625ee154d1SPekka Enberg 	if (!exit_code)
663f967c427SPrasad Joshi 		printf("\n  # KVM session ended normally.\n");
664f967c427SPrasad Joshi 
6655ee154d1SPekka Enberg 	return exit_code;
666f967c427SPrasad Joshi }
667