xref: /kvmtool/builtin-run.c (revision bb8ffd2f848767bf40f9054a80805ade9d849f99)
1f967c427SPrasad Joshi #include <stdio.h>
2f967c427SPrasad Joshi #include <string.h>
3f967c427SPrasad Joshi #include <signal.h>
4f967c427SPrasad Joshi #include <unistd.h>
5f967c427SPrasad Joshi #include <stdlib.h>
6f967c427SPrasad Joshi #include <termios.h>
78329f30bSPekka Enberg #include <sys/utsname.h>
88329f30bSPekka Enberg #include <sys/types.h>
98329f30bSPekka Enberg #include <sys/stat.h>
1026c853e4SPrasad Joshi #include <ctype.h>
11f967c427SPrasad Joshi 
12f967c427SPrasad Joshi /* user defined header files */
13f967c427SPrasad Joshi #include <linux/types.h>
14f967c427SPrasad Joshi #include <kvm/kvm.h>
155c3d55faSPekka Enberg #include <kvm/kvm-cpu.h>
16f967c427SPrasad Joshi #include <kvm/8250-serial.h>
17f967c427SPrasad Joshi #include <kvm/virtio-blk.h>
184f56d42cSAsias He #include <kvm/virtio-net.h>
19f967c427SPrasad Joshi #include <kvm/virtio-console.h>
2053eca082SSasha Levin #include <kvm/virtio-rng.h>
2182d2f21eSSasha Levin #include <kvm/virtio-balloon.h>
22f967c427SPrasad Joshi #include <kvm/disk-image.h>
23f967c427SPrasad Joshi #include <kvm/util.h>
24f967c427SPrasad Joshi #include <kvm/pci.h>
2564136c1cSPekka Enberg #include <kvm/rtc.h>
26f967c427SPrasad Joshi #include <kvm/term.h>
27ac38f433SPekka Enberg #include <kvm/ioport.h>
28d60bafe5SSasha Levin #include <kvm/threadpool.h>
29cffeab25SIngo Molnar #include <kvm/barrier.h>
30b0b42ba0SPekka Enberg #include <kvm/symbol.h>
311c7850f9SSasha Levin #include <kvm/virtio-9p.h>
325ffd4178SJohn Floren #include <kvm/vesa.h>
3337f3d50eSSasha Levin #include <kvm/ioeventfd.h>
34e342083cSJohn Floren #include <kvm/i8042.h>
35aba1efa5SPekka Enberg #include <kvm/vnc.h>
363f838fecSPekka Enberg #include <kvm/sdl.h>
37aba1efa5SPekka Enberg #include <kvm/framebuffer.h>
38f967c427SPrasad Joshi 
39f967c427SPrasad Joshi /* header files for gitish interface  */
402a24f96dSSasha Levin #include <kvm/builtin-run.h>
41f967c427SPrasad Joshi #include <kvm/parse-options.h>
42b5b501ccSIngo Molnar #include <kvm/mutex.h>
43f967c427SPrasad Joshi 
/*
 * Fallback values; kvm_cmd_run() applies each one when the matching
 * command line option was not given.
 */
#define DEFAULT_KVM_DEV		"/dev/kvm"
#define DEFAULT_CONSOLE		"serial"
#define DEFAULT_NETWORK		"user"
#define DEFAULT_HOST_ADDR	"192.168.33.1"
#define DEFAULT_GUEST_ADDR	"192.168.33.15"
#define DEFAULT_GUEST_MAC	"00:15:15:15:15:15"
#define DEFAULT_SCRIPT		"none"

/* Guest memory is given in MiB on the command line; 1 MiB == 1 << MB_SHIFT bytes. */
#define MB_SHIFT		20
/* Smallest guest RAM size accepted, in MiB and in bytes. */
#define MIN_RAM_SIZE_MB		64ULL
#define MIN_RAM_SIZE_BYTE	(MIN_RAM_SIZE_MB << MB_SHIFT)
55f967c427SPrasad Joshi 
564298ddadSSasha Levin struct kvm *kvm;
574298ddadSSasha Levin struct kvm_cpu *kvm_cpus[KVM_NR_CPUS];
58656be1b8SSasha Levin __thread struct kvm_cpu *current_kvm_cpu;
59f967c427SPrasad Joshi 
60fd834defSPekka Enberg static u64 ram_size;
61a33979d8SSasha Levin static u8  image_count;
6280ac1d05SSasha Levin static int virtio_rng;
63f967c427SPrasad Joshi static const char *kernel_cmdline;
64f967c427SPrasad Joshi static const char *kernel_filename;
65b0b42ba0SPekka Enberg static const char *vmlinux_filename;
66f967c427SPrasad Joshi static const char *initrd_filename;
67a33979d8SSasha Levin static const char *image_filename[MAX_DISK_IMAGES];
689aa4a0ebSAsias He static const char *console;
69f967c427SPrasad Joshi static const char *kvm_dev;
704f56d42cSAsias He static const char *network;
714d67c820SSasha Levin static const char *host_ip_addr;
72*bb8ffd2fSAsias He static const char *guest_ip;
73a4e724ddSSasha Levin static const char *guest_mac;
7473b7d038SAmos Kong static const char *script;
755358b0e6SSasha Levin static const char *guest_name;
760ea58e5bSPekka Enberg static bool single_step;
77a33979d8SSasha Levin static bool readonly_image[MAX_DISK_IMAGES];
785ffd4178SJohn Floren static bool vnc;
793f838fecSPekka Enberg static bool sdl;
8082d2f21eSSasha Levin static bool balloon;
81f967c427SPrasad Joshi extern bool ioport_debug;
82f967c427SPrasad Joshi extern int  active_console;
83aa400b00SPrasad Joshi extern int  debug_iodelay;
84f967c427SPrasad Joshi 
85ed036f03SCyrill Gorcunov bool do_debug_print = false;
86ed036f03SCyrill Gorcunov 
87cfd63bbbSSasha Levin static int nrcpus;
88890364f8SCyrill Gorcunov static int vidmode = -1;
89d77a9efaSCyrill Gorcunov 
90f967c427SPrasad Joshi static const char * const run_usage[] = {
918329f30bSPekka Enberg 	"kvm run [<options>] [<kernel image>]",
92f967c427SPrasad Joshi 	NULL
93f967c427SPrasad Joshi };
94f967c427SPrasad Joshi 
95a33979d8SSasha Levin static int img_name_parser(const struct option *opt, const char *arg, int unset)
96a33979d8SSasha Levin {
97a33979d8SSasha Levin 	char *sep;
98a33979d8SSasha Levin 
99a33979d8SSasha Levin 	if (image_count >= MAX_DISK_IMAGES)
100a33979d8SSasha Levin 		die("Currently only 4 images are supported");
101a33979d8SSasha Levin 
102a33979d8SSasha Levin 	image_filename[image_count] = arg;
103a33979d8SSasha Levin 	sep = strstr(arg, ",");
104a33979d8SSasha Levin 	if (sep) {
105a33979d8SSasha Levin 		if (strcmp(sep + 1, "ro") == 0)
106a33979d8SSasha Levin 			readonly_image[image_count] = 1;
107a33979d8SSasha Levin 		*sep = 0;
108a33979d8SSasha Levin 	}
109a33979d8SSasha Levin 
110a33979d8SSasha Levin 	image_count++;
111a33979d8SSasha Levin 
112a33979d8SSasha Levin 	return 0;
113a33979d8SSasha Levin }
114a33979d8SSasha Levin 
115b4422bf3SAneesh Kumar K.V static int virtio_9p_rootdir_parser(const struct option *opt, const char *arg, int unset)
116b4422bf3SAneesh Kumar K.V {
117b4422bf3SAneesh Kumar K.V 	char *tag_name;
118b4422bf3SAneesh Kumar K.V 	char tmp[PATH_MAX];
119b4422bf3SAneesh Kumar K.V 
120b4422bf3SAneesh Kumar K.V 	/*
121b4422bf3SAneesh Kumar K.V 	 * 9p dir can be of the form dirname,tag_name or
122b4422bf3SAneesh Kumar K.V 	 * just dirname. In the later case we use the
123b4422bf3SAneesh Kumar K.V 	 * default tag name
124b4422bf3SAneesh Kumar K.V 	 */
125b4422bf3SAneesh Kumar K.V 	tag_name = strstr(arg, ",");
126b4422bf3SAneesh Kumar K.V 	if (tag_name) {
127b4422bf3SAneesh Kumar K.V 		*tag_name = '\0';
128b4422bf3SAneesh Kumar K.V 		tag_name++;
129b4422bf3SAneesh Kumar K.V 	}
130b4422bf3SAneesh Kumar K.V 	if (realpath(arg, tmp))
131b4422bf3SAneesh Kumar K.V 		virtio_9p__init(kvm, tmp, tag_name);
132b4422bf3SAneesh Kumar K.V 	else
133b4422bf3SAneesh Kumar K.V 		die("Failed resolving 9p path");
134b4422bf3SAneesh Kumar K.V 	return 0;
135b4422bf3SAneesh Kumar K.V }
136b4422bf3SAneesh Kumar K.V 
137b4422bf3SAneesh Kumar K.V 
138f967c427SPrasad Joshi static const struct option options[] = {
1395e3af62dSSasha Levin 	OPT_GROUP("Basic options:"),
1405358b0e6SSasha Levin 	OPT_STRING('\0', "name", &guest_name, "guest name",
1415358b0e6SSasha Levin 			"A name for the guest"),
14280b1f72fSPekka Enberg 	OPT_INTEGER('c', "cpus", &nrcpus, "Number of CPUs"),
143f967c427SPrasad Joshi 	OPT_U64('m', "mem", &ram_size, "Virtual machine memory size in MiB."),
144d6c19027SAsias He 	OPT_CALLBACK('d', "disk", NULL, "image", "Disk image", img_name_parser),
14580b1f72fSPekka Enberg 	OPT_STRING('\0', "console", &console, "serial or virtio",
1465e3af62dSSasha Levin 			"Console to use"),
14780ac1d05SSasha Levin 	OPT_INCR('\0', "rng", &virtio_rng,
14853eca082SSasha Levin 			"Enable virtio Random Number Generator"),
149d6c19027SAsias He 	OPT_STRING('\0', "kvm-dev", &kvm_dev, "kvm-dev", "KVM device file"),
150b4422bf3SAneesh Kumar K.V 	OPT_CALLBACK('\0', "virtio-9p", NULL, "dirname,tag_name",
151b4422bf3SAneesh Kumar K.V 		     "Enable 9p over virtio", virtio_9p_rootdir_parser),
15282d2f21eSSasha Levin 	OPT_BOOLEAN('\0', "balloon", &balloon, "Enable virtio balloon"),
1535ffd4178SJohn Floren 	OPT_BOOLEAN('\0', "vnc", &vnc, "Enable VNC framebuffer"),
1543f838fecSPekka Enberg 	OPT_BOOLEAN('\0', "sdl", &sdl, "Enable SDL framebuffer"),
1555e3af62dSSasha Levin 
1565e3af62dSSasha Levin 	OPT_GROUP("Kernel options:"),
1575e3af62dSSasha Levin 	OPT_STRING('k', "kernel", &kernel_filename, "kernel",
1585e3af62dSSasha Levin 			"Kernel to boot in virtual machine"),
159d6c19027SAsias He 	OPT_STRING('i', "initrd", &initrd_filename, "initrd",
1605e3af62dSSasha Levin 			"Initial RAM disk image"),
1615e3af62dSSasha Levin 	OPT_STRING('p', "params", &kernel_cmdline, "params",
1625e3af62dSSasha Levin 			"Kernel command line arguments"),
1635e3af62dSSasha Levin 
1644d67c820SSasha Levin 	OPT_GROUP("Networking options:"),
165ec7674d7SAsias He 	OPT_STRING('n', "network", &network, "user, tap, none",
1664d67c820SSasha Levin 			"Network to use"),
1674d67c820SSasha Levin 	OPT_STRING('\0', "host-ip-addr", &host_ip_addr, "a.b.c.d",
1684d67c820SSasha Levin 			"Assign this address to the host side networking"),
169*bb8ffd2fSAsias He 	OPT_STRING('\0', "guest-ip", &guest_ip, "a.b.c.d",
170*bb8ffd2fSAsias He 			"Assign this address to the guest side networking"),
171a4e724ddSSasha Levin 	OPT_STRING('\0', "guest-mac", &guest_mac, "aa:bb:cc:dd:ee:ff",
172a4e724ddSSasha Levin 			"Assign this address to the guest side NIC"),
17373b7d038SAmos Kong 	OPT_STRING('\0', "tapscript", &script, "Script path",
17473b7d038SAmos Kong 			 "Assign a script to process created tap device"),
175d6c19027SAsias He 
176890364f8SCyrill Gorcunov 	OPT_GROUP("BIOS options:"),
177890364f8SCyrill Gorcunov 	OPT_INTEGER('\0', "vidmode", &vidmode,
178890364f8SCyrill Gorcunov 		    "Video mode"),
179890364f8SCyrill Gorcunov 
1805e3af62dSSasha Levin 	OPT_GROUP("Debug options:"),
181ed036f03SCyrill Gorcunov 	OPT_BOOLEAN('\0', "debug", &do_debug_print,
182ed036f03SCyrill Gorcunov 			"Enable debug messages"),
183d6c19027SAsias He 	OPT_BOOLEAN('\0', "debug-single-step", &single_step,
184d6c19027SAsias He 			"Enable single stepping"),
185001690a4SSasha Levin 	OPT_BOOLEAN('\0', "debug-ioport", &ioport_debug,
186d6c19027SAsias He 			"Enable ioport debugging"),
187001690a4SSasha Levin 	OPT_INTEGER('\0', "debug-iodelay", &debug_iodelay,
188aa400b00SPrasad Joshi 			"Delay IO by millisecond"),
189f967c427SPrasad Joshi 	OPT_END()
190f967c427SPrasad Joshi };
191f967c427SPrasad Joshi 
192b5b501ccSIngo Molnar /*
193b5b501ccSIngo Molnar  * Serialize debug printout so that the output of multiple vcpus does not
194b5b501ccSIngo Molnar  * get mixed up:
195b5b501ccSIngo Molnar  */
196cffeab25SIngo Molnar static int printout_done;
197b5b501ccSIngo Molnar 
19843119af7SPekka Enberg static void handle_sigusr1(int sig)
19943119af7SPekka Enberg {
20043119af7SPekka Enberg 	struct kvm_cpu *cpu = current_kvm_cpu;
20143119af7SPekka Enberg 
20243119af7SPekka Enberg 	if (!cpu)
20343119af7SPekka Enberg 		return;
20443119af7SPekka Enberg 
205b5b501ccSIngo Molnar 	printf("\n #\n # vCPU #%ld's dump:\n #\n", cpu->cpu_id);
20643119af7SPekka Enberg 	kvm_cpu__show_registers(cpu);
20743119af7SPekka Enberg 	kvm_cpu__show_code(cpu);
20843119af7SPekka Enberg 	kvm_cpu__show_page_tables(cpu);
209b5b501ccSIngo Molnar 	fflush(stdout);
210cffeab25SIngo Molnar 	printout_done = 1;
211cffeab25SIngo Molnar 	mb();
21243119af7SPekka Enberg }
21343119af7SPekka Enberg 
/* Non-zero while the guest is paused; toggled by SIGUSR2. */
static int is_paused;

/*
 * SIGUSR2 handler: pause a running guest or resume a paused one, then
 * log the new state.
 */
static void handle_sigusr2(int sig)
{
	const char *state;

	if (!is_paused)
		kvm__pause();
	else
		kvm__continue();

	is_paused = !is_paused;

	state = is_paused ? "paused" : "resumed";
	pr_info("Guest %s\n", state);
}
227d94e22b9SSasha Levin 
2289e854d1aSPekka Enberg static void handle_sigquit(int sig)
2299e854d1aSPekka Enberg {
2309e854d1aSPekka Enberg 	int i;
2319e854d1aSPekka Enberg 
2329e854d1aSPekka Enberg 	for (i = 0; i < nrcpus; i++) {
2339e854d1aSPekka Enberg 		struct kvm_cpu *cpu = kvm_cpus[i];
2349e854d1aSPekka Enberg 
23543119af7SPekka Enberg 		if (!cpu)
23643119af7SPekka Enberg 			continue;
23743119af7SPekka Enberg 
238cffeab25SIngo Molnar 		printout_done = 0;
23943119af7SPekka Enberg 		pthread_kill(cpu->thread, SIGUSR1);
240cffeab25SIngo Molnar 		/*
241cffeab25SIngo Molnar 		 * Wait for the vCPU to dump state before signalling
242cffeab25SIngo Molnar 		 * the next thread. Since this is debug code it does
243cffeab25SIngo Molnar 		 * not matter that we are burning CPU time a bit:
244cffeab25SIngo Molnar 		 */
245cffeab25SIngo Molnar 		while (!printout_done)
246cffeab25SIngo Molnar 			mb();
2479e854d1aSPekka Enberg 	}
2489e854d1aSPekka Enberg 
2499e854d1aSPekka Enberg 	serial8250__inject_sysrq(kvm);
2509e854d1aSPekka Enberg }
2519e854d1aSPekka Enberg 
2529e854d1aSPekka Enberg static void handle_sigalrm(int sig)
2539e854d1aSPekka Enberg {
2549e854d1aSPekka Enberg 	serial8250__inject_interrupt(kvm);
2559e854d1aSPekka Enberg 	virtio_console__inject_interrupt(kvm);
2569e854d1aSPekka Enberg }
2579e854d1aSPekka Enberg 
2585ee154d1SPekka Enberg static void *kvm_cpu_thread(void *arg)
2595ee154d1SPekka Enberg {
260d77a9efaSCyrill Gorcunov 	current_kvm_cpu		= arg;
2615ee154d1SPekka Enberg 
262d77a9efaSCyrill Gorcunov 	if (kvm_cpu__start(current_kvm_cpu))
2635ee154d1SPekka Enberg 		goto panic_kvm;
2645ee154d1SPekka Enberg 
265d77a9efaSCyrill Gorcunov 	kvm_cpu__delete(current_kvm_cpu);
2665ee154d1SPekka Enberg 
2675ee154d1SPekka Enberg 	return (void *) (intptr_t) 0;
2685ee154d1SPekka Enberg 
2695ee154d1SPekka Enberg panic_kvm:
2703fdf659dSSasha Levin 	fprintf(stderr, "KVM exit reason: %u (\"%s\")\n",
271d77a9efaSCyrill Gorcunov 		current_kvm_cpu->kvm_run->exit_reason,
272d77a9efaSCyrill Gorcunov 		kvm_exit_reasons[current_kvm_cpu->kvm_run->exit_reason]);
273d77a9efaSCyrill Gorcunov 	if (current_kvm_cpu->kvm_run->exit_reason == KVM_EXIT_UNKNOWN)
2745ee154d1SPekka Enberg 		fprintf(stderr, "KVM exit code: 0x%Lu\n",
275d77a9efaSCyrill Gorcunov 			current_kvm_cpu->kvm_run->hw.hardware_exit_reason);
2768e5accedSPekka Enberg 
277d77a9efaSCyrill Gorcunov 	kvm_cpu__show_registers(current_kvm_cpu);
278d77a9efaSCyrill Gorcunov 	kvm_cpu__show_code(current_kvm_cpu);
279d77a9efaSCyrill Gorcunov 	kvm_cpu__show_page_tables(current_kvm_cpu);
2805ee154d1SPekka Enberg 
281d77a9efaSCyrill Gorcunov 	kvm_cpu__delete(current_kvm_cpu);
2825ee154d1SPekka Enberg 
2835ee154d1SPekka Enberg 	return (void *) (intptr_t) 1;
2845ee154d1SPekka Enberg }
2855ee154d1SPekka Enberg 
/* Scratch buffer holding the kernel path built or chosen by find_kernel(). */
static char kernel[PATH_MAX];

/*
 * Host kernel image prefixes; "-<uname release>" is appended to each
 * before it is tried. NULL-terminated.
 */
static const char *host_kernels[] = {
	"/boot/vmlinuz",
	"/boot/bzImage",
	NULL
};

/* Kernel images tried first, relative to the current directory. NULL-terminated. */
static const char *default_kernels[] = {
	"./bzImage",
	"../../arch/x86/boot/bzImage",
	NULL
};

/* Candidate locations of an uncompressed vmlinux. NULL-terminated. */
static const char *default_vmlinux[] = {
	"../../../vmlinux",
	"../../vmlinux",
	NULL
};
305b0b42ba0SPekka Enberg 
306e08c0896SPrasad Joshi static void kernel_usage_with_options(void)
3078329f30bSPekka Enberg {
308e08c0896SPrasad Joshi 	const char **k;
3098329f30bSPekka Enberg 	struct utsname uts;
310e08c0896SPrasad Joshi 
311e08c0896SPrasad Joshi 	fprintf(stderr, "Fatal: could not find default kernel image in:\n");
31265182f37SPrasad Joshi 	k = &default_kernels[0];
313e08c0896SPrasad Joshi 	while (*k) {
314e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", *k);
315e08c0896SPrasad Joshi 		k++;
316e08c0896SPrasad Joshi 	}
317e08c0896SPrasad Joshi 
318e08c0896SPrasad Joshi 	if (uname(&uts) < 0)
319e08c0896SPrasad Joshi 		return;
320e08c0896SPrasad Joshi 
321e08c0896SPrasad Joshi 	k = &host_kernels[0];
322e08c0896SPrasad Joshi 	while (*k) {
323e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
324e08c0896SPrasad Joshi 			return;
325e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", kernel);
326e08c0896SPrasad Joshi 		k++;
327e08c0896SPrasad Joshi 	}
328a33389d8SPrasad Joshi 	fprintf(stderr, "\nPlease see 'kvm run --help' for more options.\n\n");
329e08c0896SPrasad Joshi }
330e08c0896SPrasad Joshi 
33160ded003SPekka Enberg static u64 host_ram_size(void)
33260ded003SPekka Enberg {
33360ded003SPekka Enberg 	long page_size;
33460ded003SPekka Enberg 	long nr_pages;
33560ded003SPekka Enberg 
33660ded003SPekka Enberg 	nr_pages	= sysconf(_SC_PHYS_PAGES);
337d63c5ce6SPekka Enberg 	if (nr_pages < 0) {
3384542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PHYS_PAGES) failed");
339d63c5ce6SPekka Enberg 		return 0;
340d63c5ce6SPekka Enberg 	}
34160ded003SPekka Enberg 
34260ded003SPekka Enberg 	page_size	= sysconf(_SC_PAGE_SIZE);
343d63c5ce6SPekka Enberg 	if (page_size < 0) {
3444542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PAGE_SIZE) failed");
345d63c5ce6SPekka Enberg 		return 0;
346d63c5ce6SPekka Enberg 	}
34760ded003SPekka Enberg 
34860ded003SPekka Enberg 	return (nr_pages * page_size) >> MB_SHIFT;
34960ded003SPekka Enberg }
35060ded003SPekka Enberg 
35118bd8c3bSPekka Enberg /*
35218bd8c3bSPekka Enberg  * If user didn't specify how much memory it wants to allocate for the guest,
35318bd8c3bSPekka Enberg  * avoid filling the whole host RAM.
35418bd8c3bSPekka Enberg  */
35518bd8c3bSPekka Enberg #define RAM_SIZE_RATIO		0.8
35618bd8c3bSPekka Enberg 
357fd834defSPekka Enberg static u64 get_ram_size(int nr_cpus)
358fd834defSPekka Enberg {
35906761c76SPekka Enberg 	u64 available;
36006761c76SPekka Enberg 	u64 ram_size;
361fd834defSPekka Enberg 
362fd834defSPekka Enberg 	ram_size	= 64 * (nr_cpus + 3);
363fd834defSPekka Enberg 
36460ded003SPekka Enberg 	available	= host_ram_size() * RAM_SIZE_RATIO;
365d63c5ce6SPekka Enberg 	if (!available)
366d63c5ce6SPekka Enberg 		available = MIN_RAM_SIZE_MB;
367fd834defSPekka Enberg 
368fd834defSPekka Enberg 	if (ram_size > available)
369fd834defSPekka Enberg 		ram_size	= available;
370fd834defSPekka Enberg 
371fd834defSPekka Enberg 	return ram_size;
372fd834defSPekka Enberg }
373fd834defSPekka Enberg 
374e08c0896SPrasad Joshi static const char *find_kernel(void)
375e08c0896SPrasad Joshi {
376e08c0896SPrasad Joshi 	const char **k;
3778329f30bSPekka Enberg 	struct stat st;
378e08c0896SPrasad Joshi 	struct utsname uts;
379e08c0896SPrasad Joshi 
38065182f37SPrasad Joshi 	k = &default_kernels[0];
381e08c0896SPrasad Joshi 	while (*k) {
382e08c0896SPrasad Joshi 		if (stat(*k, &st) < 0 || !S_ISREG(st.st_mode)) {
383e08c0896SPrasad Joshi 			k++;
384e08c0896SPrasad Joshi 			continue;
385e08c0896SPrasad Joshi 		}
386e08c0896SPrasad Joshi 		strncpy(kernel, *k, PATH_MAX);
387e08c0896SPrasad Joshi 		return kernel;
388e08c0896SPrasad Joshi 	}
3898329f30bSPekka Enberg 
3908329f30bSPekka Enberg 	if (uname(&uts) < 0)
3918329f30bSPekka Enberg 		return NULL;
3928329f30bSPekka Enberg 
393e08c0896SPrasad Joshi 	k = &host_kernels[0];
394e08c0896SPrasad Joshi 	while (*k) {
395e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
3968329f30bSPekka Enberg 			return NULL;
3978329f30bSPekka Enberg 
398e08c0896SPrasad Joshi 		if (stat(kernel, &st) < 0 || !S_ISREG(st.st_mode)) {
399e08c0896SPrasad Joshi 			k++;
400e08c0896SPrasad Joshi 			continue;
401e08c0896SPrasad Joshi 		}
402e08c0896SPrasad Joshi 		return kernel;
4038329f30bSPekka Enberg 
404e08c0896SPrasad Joshi 	}
4058329f30bSPekka Enberg 	return NULL;
4068329f30bSPekka Enberg }
4078329f30bSPekka Enberg 
408b0b42ba0SPekka Enberg static const char *find_vmlinux(void)
409b0b42ba0SPekka Enberg {
410b0b42ba0SPekka Enberg 	const char **vmlinux;
411b0b42ba0SPekka Enberg 
412b0b42ba0SPekka Enberg 	vmlinux = &default_vmlinux[0];
413b0b42ba0SPekka Enberg 	while (*vmlinux) {
414b0b42ba0SPekka Enberg 		struct stat st;
415b0b42ba0SPekka Enberg 
416b0b42ba0SPekka Enberg 		if (stat(*vmlinux, &st) < 0 || !S_ISREG(st.st_mode)) {
417b0b42ba0SPekka Enberg 			vmlinux++;
418b0b42ba0SPekka Enberg 			continue;
419b0b42ba0SPekka Enberg 		}
420b0b42ba0SPekka Enberg 		return *vmlinux;
421b0b42ba0SPekka Enberg 	}
422b0b42ba0SPekka Enberg 	return NULL;
423b0b42ba0SPekka Enberg }
424b0b42ba0SPekka Enberg 
/*
 * Describe the device that backs the host's root file system.
 *
 * On success @dev receives "/dev/block/<major>:0" for the device holding
 * "/" and @part receives that device's minor number.
 *
 * Returns 0 on success, -1 if "/" cannot be stat()ed or the device node
 * is not readable. @part and @dev are already written when the
 * readability check fails. @dev must be large enough for the formatted
 * path; no size is passed in.
 */
static int root_device(char *dev, long *part)
{
	struct stat root;

	if (stat("/", &root) < 0)
		return -1;

	*part = minor(root.st_dev);
	sprintf(dev, "/dev/block/%u:0", major(root.st_dev));

	return access(dev, R_OK) < 0 ? -1 : 0;
}
44026c853e4SPrasad Joshi 
44126c853e4SPrasad Joshi static char *host_image(char *cmd_line, size_t size)
44226c853e4SPrasad Joshi {
44326c853e4SPrasad Joshi 	char *t;
44426c853e4SPrasad Joshi 	char device[PATH_MAX];
44526c853e4SPrasad Joshi 	long part = 0;
44626c853e4SPrasad Joshi 
44726c853e4SPrasad Joshi 	t = malloc(PATH_MAX);
44826c853e4SPrasad Joshi 	if (!t)
44926c853e4SPrasad Joshi 		return NULL;
45026c853e4SPrasad Joshi 
45126c853e4SPrasad Joshi 	/* check for the root file system */
45226c853e4SPrasad Joshi 	if (root_device(device, &part) < 0) {
45326c853e4SPrasad Joshi 		free(t);
45426c853e4SPrasad Joshi 		return NULL;
45526c853e4SPrasad Joshi 	}
45626c853e4SPrasad Joshi 	strncpy(t, device, PATH_MAX);
45726c853e4SPrasad Joshi 	if (!strstr(cmd_line, "root=")) {
45826c853e4SPrasad Joshi 		char tmp[PATH_MAX];
45926c853e4SPrasad Joshi 		snprintf(tmp, sizeof(tmp), "root=/dev/vda%ld rw ", part);
46026c853e4SPrasad Joshi 		strlcat(cmd_line, tmp, size);
46126c853e4SPrasad Joshi 	}
46226c853e4SPrasad Joshi 	return t;
46326c853e4SPrasad Joshi }
46426c853e4SPrasad Joshi 
465f6677a1dSAmerigo Wang void kvm_run_help(void)
466f6677a1dSAmerigo Wang {
467f6677a1dSAmerigo Wang 	usage_with_options(run_usage, options);
468f6677a1dSAmerigo Wang }
469f6677a1dSAmerigo Wang 
470f967c427SPrasad Joshi int kvm_cmd_run(int argc, const char **argv, const char *prefix)
471f967c427SPrasad Joshi {
472b0b42ba0SPekka Enberg 	struct virtio_net_parameters net_params;
4732d96f6b6SSasha Levin 	static char real_cmdline[2048], default_name[20];
474aba1efa5SPekka Enberg 	struct framebuffer *fb = NULL;
475384922b3SPekka Enberg 	unsigned int nr_online_cpus;
4765ee154d1SPekka Enberg 	int exit_code = 0;
477b0b42ba0SPekka Enberg 	int max_cpus;
47826c853e4SPrasad Joshi 	char *hi;
479b0b42ba0SPekka Enberg 	int i;
48049e5227dSSasha Levin 	void *ret;
481f967c427SPrasad Joshi 
4825ee154d1SPekka Enberg 	signal(SIGALRM, handle_sigalrm);
483f967c427SPrasad Joshi 	signal(SIGQUIT, handle_sigquit);
48443119af7SPekka Enberg 	signal(SIGUSR1, handle_sigusr1);
485d94e22b9SSasha Levin 	signal(SIGUSR2, handle_sigusr2);
486f967c427SPrasad Joshi 
487cfd63bbbSSasha Levin 	nr_online_cpus = sysconf(_SC_NPROCESSORS_ONLN);
488cfd63bbbSSasha Levin 
489f967c427SPrasad Joshi 	while (argc != 0) {
490f967c427SPrasad Joshi 		argc = parse_options(argc, argv, options, run_usage,
491f967c427SPrasad Joshi 				PARSE_OPT_STOP_AT_NON_OPTION);
492f967c427SPrasad Joshi 		if (argc != 0) {
493f967c427SPrasad Joshi 			if (kernel_filename) {
494f967c427SPrasad Joshi 				fprintf(stderr, "Cannot handle parameter: "
495f967c427SPrasad Joshi 						"%s\n", argv[0]);
496f967c427SPrasad Joshi 				usage_with_options(run_usage, options);
497f967c427SPrasad Joshi 				return EINVAL;
498f967c427SPrasad Joshi 			}
499f967c427SPrasad Joshi 			/* first unhandled parameter is treated as a kernel
500f967c427SPrasad Joshi 			   image
501f967c427SPrasad Joshi 			 */
502f967c427SPrasad Joshi 			kernel_filename = argv[0];
503f967c427SPrasad Joshi 			argv++;
504f967c427SPrasad Joshi 			argc--;
505f967c427SPrasad Joshi 		}
506f967c427SPrasad Joshi 
507f967c427SPrasad Joshi 	}
508f967c427SPrasad Joshi 
50945bc2f02SPekka Enberg 	if (!kernel_filename)
510e08c0896SPrasad Joshi 		kernel_filename = find_kernel();
5118329f30bSPekka Enberg 
5128329f30bSPekka Enberg 	if (!kernel_filename) {
513e08c0896SPrasad Joshi 		kernel_usage_with_options();
5148329f30bSPekka Enberg 		return EINVAL;
5158329f30bSPekka Enberg 	}
5168329f30bSPekka Enberg 
517b0b42ba0SPekka Enberg 	vmlinux_filename = find_vmlinux();
518b0b42ba0SPekka Enberg 
519cfd63bbbSSasha Levin 	if (nrcpus == 0)
520cfd63bbbSSasha Levin 		nrcpus = nr_online_cpus;
521cfd63bbbSSasha Levin 	else if (nrcpus < 1 || nrcpus > KVM_NR_CPUS)
522d77a9efaSCyrill Gorcunov 		die("Number of CPUs %d is out of [1;%d] range", nrcpus, KVM_NR_CPUS);
523d77a9efaSCyrill Gorcunov 
524fd834defSPekka Enberg 	if (!ram_size)
525fd834defSPekka Enberg 		ram_size	= get_ram_size(nrcpus);
526fd834defSPekka Enberg 
527a2a002f9SIngo Molnar 	if (ram_size < MIN_RAM_SIZE_MB)
528a2a002f9SIngo Molnar 		die("Not enough memory specified: %lluMB (min %lluMB)", ram_size, MIN_RAM_SIZE_MB);
529a2a002f9SIngo Molnar 
53060ded003SPekka Enberg 	if (ram_size > host_ram_size())
5314542f276SCyrill Gorcunov 		pr_warning("Guest memory size %lluMB exceeds host physical RAM size %lluMB", ram_size, host_ram_size());
53260ded003SPekka Enberg 
533f967c427SPrasad Joshi 	ram_size <<= MB_SHIFT;
534f967c427SPrasad Joshi 
535f967c427SPrasad Joshi 	if (!kvm_dev)
536f967c427SPrasad Joshi 		kvm_dev = DEFAULT_KVM_DEV;
537f967c427SPrasad Joshi 
5389aa4a0ebSAsias He 	if (!console)
5399aa4a0ebSAsias He 		console = DEFAULT_CONSOLE;
5409aa4a0ebSAsias He 
5419aa4a0ebSAsias He 	if (!strncmp(console, "virtio", 6))
542f967c427SPrasad Joshi 		active_console  = CONSOLE_VIRTIO;
5439aa4a0ebSAsias He 	else
5449aa4a0ebSAsias He 		active_console  = CONSOLE_8250;
545f967c427SPrasad Joshi 
5464d67c820SSasha Levin 	if (!host_ip_addr)
5474d67c820SSasha Levin 		host_ip_addr = DEFAULT_HOST_ADDR;
5484d67c820SSasha Levin 
549*bb8ffd2fSAsias He 	if (!guest_ip)
550*bb8ffd2fSAsias He 		guest_ip = DEFAULT_GUEST_ADDR;
551*bb8ffd2fSAsias He 
552a4e724ddSSasha Levin 	if (!guest_mac)
553a4e724ddSSasha Levin 		guest_mac = DEFAULT_GUEST_MAC;
554a4e724ddSSasha Levin 
55573b7d038SAmos Kong 	if (!script)
55673b7d038SAmos Kong 		script = DEFAULT_SCRIPT;
55773b7d038SAmos Kong 
558b0b42ba0SPekka Enberg 	symbol__init(vmlinux_filename);
559b0b42ba0SPekka Enberg 
560f967c427SPrasad Joshi 	term_init();
561f967c427SPrasad Joshi 
5622d96f6b6SSasha Levin 	if (!guest_name) {
5632d96f6b6SSasha Levin 		sprintf(default_name, "guest-%u", getpid());
5642d96f6b6SSasha Levin 		guest_name = default_name;
5652d96f6b6SSasha Levin 	}
5662d96f6b6SSasha Levin 
5675358b0e6SSasha Levin 	kvm = kvm__init(kvm_dev, ram_size, guest_name);
568f967c427SPrasad Joshi 
5696d6a4d41SPekka Enberg 	kvm->single_step = single_step;
5706d6a4d41SPekka Enberg 
57137f3d50eSSasha Levin 	ioeventfd__init();
57237f3d50eSSasha Levin 
573384922b3SPekka Enberg 	max_cpus = kvm__max_cpus(kvm);
574384922b3SPekka Enberg 
575384922b3SPekka Enberg 	if (nrcpus > max_cpus) {
576384922b3SPekka Enberg 		printf("  # Limit the number of CPUs to %d\n", max_cpus);
577384922b3SPekka Enberg 		kvm->nrcpus	= max_cpus;
578384922b3SPekka Enberg 	}
579384922b3SPekka Enberg 
5800c7c14a7SCyrill Gorcunov 	kvm->nrcpus = nrcpus;
5810c7c14a7SCyrill Gorcunov 
582890364f8SCyrill Gorcunov 	/*
583890364f8SCyrill Gorcunov 	 * vidmode should be either specified
584890364f8SCyrill Gorcunov 	 * either set by default
585890364f8SCyrill Gorcunov 	 */
586890364f8SCyrill Gorcunov 	if (vnc || sdl) {
587890364f8SCyrill Gorcunov 		if (vidmode == -1)
588890364f8SCyrill Gorcunov 			vidmode = 0x312;
589890364f8SCyrill Gorcunov 	} else
590890364f8SCyrill Gorcunov 		vidmode = 0;
591890364f8SCyrill Gorcunov 
59226c853e4SPrasad Joshi 	memset(real_cmdline, 0, sizeof(real_cmdline));
593ea7016a9SPekka Enberg 	strcpy(real_cmdline, "notsc noapic noacpi pci=conf1 reboot=k panic=1");
5943f838fecSPekka Enberg 	if (vnc || sdl) {
5955ffd4178SJohn Floren 		strcat(real_cmdline, " video=vesafb console=tty0");
596890364f8SCyrill Gorcunov 	} else
5975ffd4178SJohn Floren 		strcat(real_cmdline, " console=ttyS0 earlyprintk=serial");
598d74181ccSSasha Levin 	strcat(real_cmdline, " ");
59926c853e4SPrasad Joshi 	if (kernel_cmdline)
60026c853e4SPrasad Joshi 		strlcat(real_cmdline, kernel_cmdline, sizeof(real_cmdline));
60126c853e4SPrasad Joshi 
60226c853e4SPrasad Joshi 	hi = NULL;
603a33979d8SSasha Levin 	if (!image_filename[0]) {
60426c853e4SPrasad Joshi 		hi = host_image(real_cmdline, sizeof(real_cmdline));
60526c853e4SPrasad Joshi 		if (hi) {
606a33979d8SSasha Levin 			image_filename[0] = hi;
607a33979d8SSasha Levin 			readonly_image[0] = true;
60825bf86f6SSasha Levin 			image_count++;
60926c853e4SPrasad Joshi 		}
61026c853e4SPrasad Joshi 	}
61126c853e4SPrasad Joshi 
61226c853e4SPrasad Joshi 	if (!strstr(real_cmdline, "root="))
61326c853e4SPrasad Joshi 		strlcat(real_cmdline, " root=/dev/vda rw ", sizeof(real_cmdline));
61426c853e4SPrasad Joshi 
615c1ed214eSPrasad Joshi 	if (image_count) {
616bcb6aacaSPrasad Joshi 		kvm->nr_disks = image_count;
617c1ed214eSPrasad Joshi 		kvm->disks    = disk_image__open_all(image_filename, readonly_image, image_count);
618c1ed214eSPrasad Joshi 		if (!kvm->disks)
619c1ed214eSPrasad Joshi 			die("Unable to load all disk images.");
62038605e1cSSasha Levin 
621bcb6aacaSPrasad Joshi 		virtio_blk__init_all(kvm);
622f967c427SPrasad Joshi 	}
623c1ed214eSPrasad Joshi 
62426c853e4SPrasad Joshi 	free(hi);
625f967c427SPrasad Joshi 
6262d96f6b6SSasha Levin 	printf("  # kvm run -k %s -m %Lu -c %d --name %s\n", kernel_filename, ram_size / 1024 / 1024, nrcpus, guest_name);
627471c6facSPekka Enberg 
628f967c427SPrasad Joshi 	if (!kvm__load_kernel(kvm, kernel_filename, initrd_filename,
6295ffd4178SJohn Floren 				real_cmdline, vidmode))
630f967c427SPrasad Joshi 		die("unable to load kernel %s", kernel_filename);
631f967c427SPrasad Joshi 
632b0b42ba0SPekka Enberg 	kvm->vmlinux		= vmlinux_filename;
633b0b42ba0SPekka Enberg 
634ac38f433SPekka Enberg 	ioport__setup_legacy();
635ac38f433SPekka Enberg 
63664136c1cSPekka Enberg 	rtc__init();
63764136c1cSPekka Enberg 
638f967c427SPrasad Joshi 	serial8250__init(kvm);
639f967c427SPrasad Joshi 
640f967c427SPrasad Joshi 	pci__init();
641f967c427SPrasad Joshi 
6421621292eSSasha Levin 	if (active_console == CONSOLE_VIRTIO)
643f967c427SPrasad Joshi 		virtio_console__init(kvm);
644f967c427SPrasad Joshi 
64553eca082SSasha Levin 	if (virtio_rng)
64680ac1d05SSasha Levin 		while (virtio_rng--)
64753eca082SSasha Levin 			virtio_rng__init(kvm);
64853eca082SSasha Levin 
64982d2f21eSSasha Levin 	if (balloon)
65082d2f21eSSasha Levin 		virtio_bln__init(kvm);
65182d2f21eSSasha Levin 
6524f56d42cSAsias He 	if (!network)
6534f56d42cSAsias He 		network = DEFAULT_NETWORK;
6544f56d42cSAsias He 
655ec7674d7SAsias He 	if (strncmp(network, "none", 4)) {
656ec7674d7SAsias He 		net_params.host_ip = host_ip_addr;
657*bb8ffd2fSAsias He 		net_params.guest_ip = guest_ip;
658ec7674d7SAsias He 		net_params.kvm = kvm;
659ec7674d7SAsias He 		net_params.script = script;
660a4e724ddSSasha Levin 		sscanf(guest_mac, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
661a4e724ddSSasha Levin 			net_params.guest_mac,
662a4e724ddSSasha Levin 			net_params.guest_mac+1,
663a4e724ddSSasha Levin 			net_params.guest_mac+2,
664a4e724ddSSasha Levin 			net_params.guest_mac+3,
665a4e724ddSSasha Levin 			net_params.guest_mac+4,
666a4e724ddSSasha Levin 			net_params.guest_mac+5);
667a4e724ddSSasha Levin 
668ec7674d7SAsias He 		if (!strncmp(network, "user", 4))
669ec7674d7SAsias He 			net_params.mode = NET_MODE_USER;
670ec7674d7SAsias He 		else if (!strncmp(network, "tap", 3))
671ec7674d7SAsias He 			net_params.mode = NET_MODE_TAP;
672ec7674d7SAsias He 		else
673ec7674d7SAsias He 			die("Unkown network mode %s, please use -network user, tap, none", network);
674bdfcfca6SSasha Levin 		virtio_net__init(&net_params);
675bdfcfca6SSasha Levin 	}
6764f56d42cSAsias He 
677f967c427SPrasad Joshi 	kvm__start_timer(kvm);
678f967c427SPrasad Joshi 
6798ec7e042SSasha Levin 	kvm__setup_bios(kvm);
6808ec7e042SSasha Levin 
681d77a9efaSCyrill Gorcunov 	for (i = 0; i < nrcpus; i++) {
682d77a9efaSCyrill Gorcunov 		kvm_cpus[i] = kvm_cpu__init(kvm, i);
683d77a9efaSCyrill Gorcunov 		if (!kvm_cpus[i])
6845ee154d1SPekka Enberg 			die("unable to initialize KVM VCPU");
685839051d9SSasha Levin 	}
6865ee154d1SPekka Enberg 
687839051d9SSasha Levin 	kvm__init_ram(kvm);
688839051d9SSasha Levin 
689714e5b7fSSasha Levin 	kbd__init(kvm);
690714e5b7fSSasha Levin 
6913f838fecSPekka Enberg 	if (vnc || sdl)
6923f838fecSPekka Enberg 		fb = vesa__init(kvm);
6933f838fecSPekka Enberg 
694e342083cSJohn Floren 	if (vnc) {
695aba1efa5SPekka Enberg 		if (fb)
696aba1efa5SPekka Enberg 			vnc__init(fb);
6973f838fecSPekka Enberg 	}
6983f838fecSPekka Enberg 
6993f838fecSPekka Enberg 	if (sdl) {
7003f838fecSPekka Enberg 		if (fb)
7013f838fecSPekka Enberg 			sdl__init(fb);
7023f838fecSPekka Enberg 	}
703aba1efa5SPekka Enberg 
704aba1efa5SPekka Enberg 	fb__start();
705aba1efa5SPekka Enberg 
706d60bafe5SSasha Levin 	thread_pool__init(nr_online_cpus);
70737f3d50eSSasha Levin 	ioeventfd__start();
708d60bafe5SSasha Levin 
709839051d9SSasha Levin 	for (i = 0; i < nrcpus; i++) {
710d77a9efaSCyrill Gorcunov 		if (pthread_create(&kvm_cpus[i]->thread, NULL, kvm_cpu_thread, kvm_cpus[i]) != 0)
7115ee154d1SPekka Enberg 			die("unable to create KVM VCPU thread");
7125ee154d1SPekka Enberg 	}
7135ee154d1SPekka Enberg 
71449e5227dSSasha Levin 	/* Only VCPU #0 is going to exit by itself when shutting down */
71549e5227dSSasha Levin 	if (pthread_join(kvm_cpus[0]->thread, &ret) != 0)
71649e5227dSSasha Levin 		exit_code = 1;
7175ee154d1SPekka Enberg 
71849e5227dSSasha Levin 	for (i = 1; i < nrcpus; i++) {
71949e5227dSSasha Levin 		pthread_kill(kvm_cpus[i]->thread, SIGKVMEXIT);
720d77a9efaSCyrill Gorcunov 		if (pthread_join(kvm_cpus[i]->thread, &ret) != 0)
7215ee154d1SPekka Enberg 			die("pthread_join");
7225ee154d1SPekka Enberg 
7235ee154d1SPekka Enberg 		if (ret != NULL)
7245ee154d1SPekka Enberg 			exit_code = 1;
7255ee154d1SPekka Enberg 	}
726f967c427SPrasad Joshi 
727aba1efa5SPekka Enberg 	fb__stop();
728aba1efa5SPekka Enberg 
729a0a1e3c2SPrasad Joshi 	virtio_blk__delete_all(kvm);
73080ac1d05SSasha Levin 	virtio_rng__delete_all(kvm);
731a0a1e3c2SPrasad Joshi 
7329df47d00SPrasad Joshi 	disk_image__close_all(kvm->disks, image_count);
733f967c427SPrasad Joshi 	kvm__delete(kvm);
734f967c427SPrasad Joshi 
7355ee154d1SPekka Enberg 	if (!exit_code)
736f967c427SPrasad Joshi 		printf("\n  # KVM session ended normally.\n");
737f967c427SPrasad Joshi 
7385ee154d1SPekka Enberg 	return exit_code;
739f967c427SPrasad Joshi }
740