xref: /kvmtool/builtin-run.c (revision 2d96f6b6b1980f7d228c5a16f8bdba016c4503c0)
1f967c427SPrasad Joshi #include <stdio.h>
2f967c427SPrasad Joshi #include <string.h>
3f967c427SPrasad Joshi #include <signal.h>
4f967c427SPrasad Joshi #include <unistd.h>
5f967c427SPrasad Joshi #include <stdlib.h>
6f967c427SPrasad Joshi #include <termios.h>
78329f30bSPekka Enberg #include <sys/utsname.h>
88329f30bSPekka Enberg #include <sys/types.h>
98329f30bSPekka Enberg #include <sys/stat.h>
1026c853e4SPrasad Joshi #include <ctype.h>
11f967c427SPrasad Joshi 
12f967c427SPrasad Joshi /* user defined header files */
13f967c427SPrasad Joshi #include <linux/types.h>
14f967c427SPrasad Joshi #include <kvm/kvm.h>
155c3d55faSPekka Enberg #include <kvm/kvm-cpu.h>
16f967c427SPrasad Joshi #include <kvm/8250-serial.h>
17f967c427SPrasad Joshi #include <kvm/virtio-blk.h>
184f56d42cSAsias He #include <kvm/virtio-net.h>
19f967c427SPrasad Joshi #include <kvm/virtio-console.h>
2053eca082SSasha Levin #include <kvm/virtio-rng.h>
2182d2f21eSSasha Levin #include <kvm/virtio-balloon.h>
22f967c427SPrasad Joshi #include <kvm/disk-image.h>
23f967c427SPrasad Joshi #include <kvm/util.h>
24f967c427SPrasad Joshi #include <kvm/pci.h>
2564136c1cSPekka Enberg #include <kvm/rtc.h>
26f967c427SPrasad Joshi #include <kvm/term.h>
27ac38f433SPekka Enberg #include <kvm/ioport.h>
28d60bafe5SSasha Levin #include <kvm/threadpool.h>
29cffeab25SIngo Molnar #include <kvm/barrier.h>
30b0b42ba0SPekka Enberg #include <kvm/symbol.h>
311c7850f9SSasha Levin #include <kvm/virtio-9p.h>
325ffd4178SJohn Floren #include <kvm/vesa.h>
3337f3d50eSSasha Levin #include <kvm/ioeventfd.h>
34e342083cSJohn Floren #include <kvm/i8042.h>
35aba1efa5SPekka Enberg #include <kvm/vnc.h>
363f838fecSPekka Enberg #include <kvm/sdl.h>
37aba1efa5SPekka Enberg #include <kvm/framebuffer.h>
38f967c427SPrasad Joshi 
39f967c427SPrasad Joshi /* header files for gitish interface  */
40f967c427SPrasad Joshi #include <kvm/kvm-run.h>
41f967c427SPrasad Joshi #include <kvm/parse-options.h>
42b5b501ccSIngo Molnar #include <kvm/mutex.h>
43f967c427SPrasad Joshi 
44f967c427SPrasad Joshi #define DEFAULT_KVM_DEV		"/dev/kvm"
459aa4a0ebSAsias He #define DEFAULT_CONSOLE		"serial"
46bd30e200SAsias He #define DEFAULT_NETWORK		"user"
47745c7231SAsias He #define DEFAULT_HOST_ADDR	"192.168.33.1"
48a0db70d9SAsias He #define DEFAULT_GUEST_MAC	"00:15:15:15:15:15"
4973b7d038SAmos Kong #define DEFAULT_SCRIPT		"none"
50f967c427SPrasad Joshi 
51f967c427SPrasad Joshi #define MB_SHIFT		(20)
52a2a002f9SIngo Molnar #define MIN_RAM_SIZE_MB		(64ULL)
53f967c427SPrasad Joshi #define MIN_RAM_SIZE_BYTE	(MIN_RAM_SIZE_MB << MB_SHIFT)
54f967c427SPrasad Joshi 
554298ddadSSasha Levin struct kvm *kvm;
564298ddadSSasha Levin struct kvm_cpu *kvm_cpus[KVM_NR_CPUS];
57656be1b8SSasha Levin __thread struct kvm_cpu *current_kvm_cpu;
58f967c427SPrasad Joshi 
59fd834defSPekka Enberg static u64 ram_size;
60a33979d8SSasha Levin static u8  image_count;
6180ac1d05SSasha Levin static int virtio_rng;
62f967c427SPrasad Joshi static const char *kernel_cmdline;
63f967c427SPrasad Joshi static const char *kernel_filename;
64b0b42ba0SPekka Enberg static const char *vmlinux_filename;
65f967c427SPrasad Joshi static const char *initrd_filename;
66a33979d8SSasha Levin static const char *image_filename[MAX_DISK_IMAGES];
679aa4a0ebSAsias He static const char *console;
68f967c427SPrasad Joshi static const char *kvm_dev;
694f56d42cSAsias He static const char *network;
704d67c820SSasha Levin static const char *host_ip_addr;
71a4e724ddSSasha Levin static const char *guest_mac;
7273b7d038SAmos Kong static const char *script;
735358b0e6SSasha Levin static const char *guest_name;
740ea58e5bSPekka Enberg static bool single_step;
75a33979d8SSasha Levin static bool readonly_image[MAX_DISK_IMAGES];
765ffd4178SJohn Floren static bool vnc;
773f838fecSPekka Enberg static bool sdl;
7882d2f21eSSasha Levin static bool balloon;
79f967c427SPrasad Joshi extern bool ioport_debug;
80f967c427SPrasad Joshi extern int  active_console;
81aa400b00SPrasad Joshi extern int  debug_iodelay;
82f967c427SPrasad Joshi 
83ed036f03SCyrill Gorcunov bool do_debug_print = false;
84ed036f03SCyrill Gorcunov 
85cfd63bbbSSasha Levin static int nrcpus;
86890364f8SCyrill Gorcunov static int vidmode = -1;
87d77a9efaSCyrill Gorcunov 
/* NULL-terminated usage lines passed to the option parser / usage printer. */
static const char * const run_usage[] = {
	"kvm run [<options>] [<kernel image>]",
	NULL,
};
92f967c427SPrasad Joshi 
93a33979d8SSasha Levin static int img_name_parser(const struct option *opt, const char *arg, int unset)
94a33979d8SSasha Levin {
95a33979d8SSasha Levin 	char *sep;
96a33979d8SSasha Levin 
97a33979d8SSasha Levin 	if (image_count >= MAX_DISK_IMAGES)
98a33979d8SSasha Levin 		die("Currently only 4 images are supported");
99a33979d8SSasha Levin 
100a33979d8SSasha Levin 	image_filename[image_count] = arg;
101a33979d8SSasha Levin 	sep = strstr(arg, ",");
102a33979d8SSasha Levin 	if (sep) {
103a33979d8SSasha Levin 		if (strcmp(sep + 1, "ro") == 0)
104a33979d8SSasha Levin 			readonly_image[image_count] = 1;
105a33979d8SSasha Levin 		*sep = 0;
106a33979d8SSasha Levin 	}
107a33979d8SSasha Levin 
108a33979d8SSasha Levin 	image_count++;
109a33979d8SSasha Levin 
110a33979d8SSasha Levin 	return 0;
111a33979d8SSasha Levin }
112a33979d8SSasha Levin 
113b4422bf3SAneesh Kumar K.V static int virtio_9p_rootdir_parser(const struct option *opt, const char *arg, int unset)
114b4422bf3SAneesh Kumar K.V {
115b4422bf3SAneesh Kumar K.V 	char *tag_name;
116b4422bf3SAneesh Kumar K.V 	char tmp[PATH_MAX];
117b4422bf3SAneesh Kumar K.V 
118b4422bf3SAneesh Kumar K.V 	/*
119b4422bf3SAneesh Kumar K.V 	 * 9p dir can be of the form dirname,tag_name or
120b4422bf3SAneesh Kumar K.V 	 * just dirname. In the later case we use the
121b4422bf3SAneesh Kumar K.V 	 * default tag name
122b4422bf3SAneesh Kumar K.V 	 */
123b4422bf3SAneesh Kumar K.V 	tag_name = strstr(arg, ",");
124b4422bf3SAneesh Kumar K.V 	if (tag_name) {
125b4422bf3SAneesh Kumar K.V 		*tag_name = '\0';
126b4422bf3SAneesh Kumar K.V 		tag_name++;
127b4422bf3SAneesh Kumar K.V 	}
128b4422bf3SAneesh Kumar K.V 	if (realpath(arg, tmp))
129b4422bf3SAneesh Kumar K.V 		virtio_9p__init(kvm, tmp, tag_name);
130b4422bf3SAneesh Kumar K.V 	else
131b4422bf3SAneesh Kumar K.V 		die("Failed resolving 9p path");
132b4422bf3SAneesh Kumar K.V 	return 0;
133b4422bf3SAneesh Kumar K.V }
134b4422bf3SAneesh Kumar K.V 
135b4422bf3SAneesh Kumar K.V 
136f967c427SPrasad Joshi static const struct option options[] = {
1375e3af62dSSasha Levin 	OPT_GROUP("Basic options:"),
1385358b0e6SSasha Levin 	OPT_STRING('\0', "name", &guest_name, "guest name",
1395358b0e6SSasha Levin 			"A name for the guest"),
14080b1f72fSPekka Enberg 	OPT_INTEGER('c', "cpus", &nrcpus, "Number of CPUs"),
141f967c427SPrasad Joshi 	OPT_U64('m', "mem", &ram_size, "Virtual machine memory size in MiB."),
142d6c19027SAsias He 	OPT_CALLBACK('d', "disk", NULL, "image", "Disk image", img_name_parser),
14380b1f72fSPekka Enberg 	OPT_STRING('\0', "console", &console, "serial or virtio",
1445e3af62dSSasha Levin 			"Console to use"),
14580ac1d05SSasha Levin 	OPT_INCR('\0', "rng", &virtio_rng,
14653eca082SSasha Levin 			"Enable virtio Random Number Generator"),
147d6c19027SAsias He 	OPT_STRING('\0', "kvm-dev", &kvm_dev, "kvm-dev", "KVM device file"),
148b4422bf3SAneesh Kumar K.V 	OPT_CALLBACK('\0', "virtio-9p", NULL, "dirname,tag_name",
149b4422bf3SAneesh Kumar K.V 		     "Enable 9p over virtio", virtio_9p_rootdir_parser),
15082d2f21eSSasha Levin 	OPT_BOOLEAN('\0', "balloon", &balloon, "Enable virtio balloon"),
1515ffd4178SJohn Floren 	OPT_BOOLEAN('\0', "vnc", &vnc, "Enable VNC framebuffer"),
1523f838fecSPekka Enberg 	OPT_BOOLEAN('\0', "sdl", &sdl, "Enable SDL framebuffer"),
1535e3af62dSSasha Levin 
1545e3af62dSSasha Levin 	OPT_GROUP("Kernel options:"),
1555e3af62dSSasha Levin 	OPT_STRING('k', "kernel", &kernel_filename, "kernel",
1565e3af62dSSasha Levin 			"Kernel to boot in virtual machine"),
157d6c19027SAsias He 	OPT_STRING('i', "initrd", &initrd_filename, "initrd",
1585e3af62dSSasha Levin 			"Initial RAM disk image"),
1595e3af62dSSasha Levin 	OPT_STRING('p', "params", &kernel_cmdline, "params",
1605e3af62dSSasha Levin 			"Kernel command line arguments"),
1615e3af62dSSasha Levin 
1624d67c820SSasha Levin 	OPT_GROUP("Networking options:"),
163ec7674d7SAsias He 	OPT_STRING('n', "network", &network, "user, tap, none",
1644d67c820SSasha Levin 			"Network to use"),
1654d67c820SSasha Levin 	OPT_STRING('\0', "host-ip-addr", &host_ip_addr, "a.b.c.d",
1664d67c820SSasha Levin 			"Assign this address to the host side networking"),
167a4e724ddSSasha Levin 	OPT_STRING('\0', "guest-mac", &guest_mac, "aa:bb:cc:dd:ee:ff",
168a4e724ddSSasha Levin 			"Assign this address to the guest side NIC"),
16973b7d038SAmos Kong 	OPT_STRING('\0', "tapscript", &script, "Script path",
17073b7d038SAmos Kong 			 "Assign a script to process created tap device"),
171d6c19027SAsias He 
172890364f8SCyrill Gorcunov 	OPT_GROUP("BIOS options:"),
173890364f8SCyrill Gorcunov 	OPT_INTEGER('\0', "vidmode", &vidmode,
174890364f8SCyrill Gorcunov 		    "Video mode"),
175890364f8SCyrill Gorcunov 
1765e3af62dSSasha Levin 	OPT_GROUP("Debug options:"),
177ed036f03SCyrill Gorcunov 	OPT_BOOLEAN('\0', "debug", &do_debug_print,
178ed036f03SCyrill Gorcunov 			"Enable debug messages"),
179d6c19027SAsias He 	OPT_BOOLEAN('\0', "debug-single-step", &single_step,
180d6c19027SAsias He 			"Enable single stepping"),
181d6c19027SAsias He 	OPT_BOOLEAN('\0', "debug-ioport-debug", &ioport_debug,
182d6c19027SAsias He 			"Enable ioport debugging"),
183aa400b00SPrasad Joshi 	OPT_INTEGER('\0', "debug_iodelay", &debug_iodelay,
184aa400b00SPrasad Joshi 			"Delay IO by millisecond"),
185f967c427SPrasad Joshi 	OPT_END()
186f967c427SPrasad Joshi };
187f967c427SPrasad Joshi 
188b5b501ccSIngo Molnar /*
189b5b501ccSIngo Molnar  * Serialize debug printout so that the output of multiple vcpus does not
190b5b501ccSIngo Molnar  * get mixed up:
191b5b501ccSIngo Molnar  */
192cffeab25SIngo Molnar static int printout_done;
193b5b501ccSIngo Molnar 
19443119af7SPekka Enberg static void handle_sigusr1(int sig)
19543119af7SPekka Enberg {
19643119af7SPekka Enberg 	struct kvm_cpu *cpu = current_kvm_cpu;
19743119af7SPekka Enberg 
19843119af7SPekka Enberg 	if (!cpu)
19943119af7SPekka Enberg 		return;
20043119af7SPekka Enberg 
201b5b501ccSIngo Molnar 	printf("\n #\n # vCPU #%ld's dump:\n #\n", cpu->cpu_id);
20243119af7SPekka Enberg 	kvm_cpu__show_registers(cpu);
20343119af7SPekka Enberg 	kvm_cpu__show_code(cpu);
20443119af7SPekka Enberg 	kvm_cpu__show_page_tables(cpu);
205b5b501ccSIngo Molnar 	fflush(stdout);
206cffeab25SIngo Molnar 	printout_done = 1;
207cffeab25SIngo Molnar 	mb();
20843119af7SPekka Enberg }
20943119af7SPekka Enberg 
/* Non-zero while the guest is paused; toggled by every SIGUSR2. */
static int is_paused;

/*
 * SIGUSR2 handler: pause a running guest or resume a paused one, flip
 * is_paused and log the new state.
 */
static void handle_sigusr2(int sig)
{
	const int was_paused = is_paused;

	if (was_paused)
		kvm__continue();
	else
		kvm__pause();

	is_paused = !was_paused;
	pr_info("Guest %s\n", is_paused ? "paused" : "resumed");
}
223d94e22b9SSasha Levin 
2249e854d1aSPekka Enberg static void handle_sigquit(int sig)
2259e854d1aSPekka Enberg {
2269e854d1aSPekka Enberg 	int i;
2279e854d1aSPekka Enberg 
2289e854d1aSPekka Enberg 	for (i = 0; i < nrcpus; i++) {
2299e854d1aSPekka Enberg 		struct kvm_cpu *cpu = kvm_cpus[i];
2309e854d1aSPekka Enberg 
23143119af7SPekka Enberg 		if (!cpu)
23243119af7SPekka Enberg 			continue;
23343119af7SPekka Enberg 
234cffeab25SIngo Molnar 		printout_done = 0;
23543119af7SPekka Enberg 		pthread_kill(cpu->thread, SIGUSR1);
236cffeab25SIngo Molnar 		/*
237cffeab25SIngo Molnar 		 * Wait for the vCPU to dump state before signalling
238cffeab25SIngo Molnar 		 * the next thread. Since this is debug code it does
239cffeab25SIngo Molnar 		 * not matter that we are burning CPU time a bit:
240cffeab25SIngo Molnar 		 */
241cffeab25SIngo Molnar 		while (!printout_done)
242cffeab25SIngo Molnar 			mb();
2439e854d1aSPekka Enberg 	}
2449e854d1aSPekka Enberg 
2459e854d1aSPekka Enberg 	serial8250__inject_sysrq(kvm);
2469e854d1aSPekka Enberg }
2479e854d1aSPekka Enberg 
2489e854d1aSPekka Enberg static void handle_sigalrm(int sig)
2499e854d1aSPekka Enberg {
2509e854d1aSPekka Enberg 	serial8250__inject_interrupt(kvm);
2519e854d1aSPekka Enberg 	virtio_console__inject_interrupt(kvm);
2529e854d1aSPekka Enberg }
2539e854d1aSPekka Enberg 
2545ee154d1SPekka Enberg static void *kvm_cpu_thread(void *arg)
2555ee154d1SPekka Enberg {
256d77a9efaSCyrill Gorcunov 	current_kvm_cpu		= arg;
2575ee154d1SPekka Enberg 
258d77a9efaSCyrill Gorcunov 	if (kvm_cpu__start(current_kvm_cpu))
2595ee154d1SPekka Enberg 		goto panic_kvm;
2605ee154d1SPekka Enberg 
261d77a9efaSCyrill Gorcunov 	kvm_cpu__delete(current_kvm_cpu);
2625ee154d1SPekka Enberg 
2635ee154d1SPekka Enberg 	return (void *) (intptr_t) 0;
2645ee154d1SPekka Enberg 
2655ee154d1SPekka Enberg panic_kvm:
2663fdf659dSSasha Levin 	fprintf(stderr, "KVM exit reason: %u (\"%s\")\n",
267d77a9efaSCyrill Gorcunov 		current_kvm_cpu->kvm_run->exit_reason,
268d77a9efaSCyrill Gorcunov 		kvm_exit_reasons[current_kvm_cpu->kvm_run->exit_reason]);
269d77a9efaSCyrill Gorcunov 	if (current_kvm_cpu->kvm_run->exit_reason == KVM_EXIT_UNKNOWN)
2705ee154d1SPekka Enberg 		fprintf(stderr, "KVM exit code: 0x%Lu\n",
271d77a9efaSCyrill Gorcunov 			current_kvm_cpu->kvm_run->hw.hardware_exit_reason);
2728e5accedSPekka Enberg 
273d77a9efaSCyrill Gorcunov 	kvm_cpu__show_registers(current_kvm_cpu);
274d77a9efaSCyrill Gorcunov 	kvm_cpu__show_code(current_kvm_cpu);
275d77a9efaSCyrill Gorcunov 	kvm_cpu__show_page_tables(current_kvm_cpu);
2765ee154d1SPekka Enberg 
277d77a9efaSCyrill Gorcunov 	kvm_cpu__delete(current_kvm_cpu);
2785ee154d1SPekka Enberg 
2795ee154d1SPekka Enberg 	return (void *) (intptr_t) 1;
2805ee154d1SPekka Enberg }
2815ee154d1SPekka Enberg 
282e08c0896SPrasad Joshi static char kernel[PATH_MAX];
283b0b42ba0SPekka Enberg 
284b0b42ba0SPekka Enberg static const char *host_kernels[] = {
285e08c0896SPrasad Joshi 	"/boot/vmlinuz",
286e08c0896SPrasad Joshi 	"/boot/bzImage",
287e08c0896SPrasad Joshi 	NULL
288e08c0896SPrasad Joshi };
289b0b42ba0SPekka Enberg 
290b0b42ba0SPekka Enberg static const char *default_kernels[] = {
291e08c0896SPrasad Joshi 	"./bzImage",
292e08c0896SPrasad Joshi 	"../../arch/x86/boot/bzImage",
293e08c0896SPrasad Joshi 	NULL
294e08c0896SPrasad Joshi };
2958329f30bSPekka Enberg 
296b0b42ba0SPekka Enberg static const char *default_vmlinux[] = {
297b0b42ba0SPekka Enberg 	"../../../vmlinux",
298b0b42ba0SPekka Enberg 	"../../vmlinux",
299b0b42ba0SPekka Enberg 	NULL
300b0b42ba0SPekka Enberg };
301b0b42ba0SPekka Enberg 
302e08c0896SPrasad Joshi static void kernel_usage_with_options(void)
3038329f30bSPekka Enberg {
304e08c0896SPrasad Joshi 	const char **k;
3058329f30bSPekka Enberg 	struct utsname uts;
306e08c0896SPrasad Joshi 
307e08c0896SPrasad Joshi 	fprintf(stderr, "Fatal: could not find default kernel image in:\n");
30865182f37SPrasad Joshi 	k = &default_kernels[0];
309e08c0896SPrasad Joshi 	while (*k) {
310e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", *k);
311e08c0896SPrasad Joshi 		k++;
312e08c0896SPrasad Joshi 	}
313e08c0896SPrasad Joshi 
314e08c0896SPrasad Joshi 	if (uname(&uts) < 0)
315e08c0896SPrasad Joshi 		return;
316e08c0896SPrasad Joshi 
317e08c0896SPrasad Joshi 	k = &host_kernels[0];
318e08c0896SPrasad Joshi 	while (*k) {
319e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
320e08c0896SPrasad Joshi 			return;
321e08c0896SPrasad Joshi 		fprintf(stderr, "\t%s\n", kernel);
322e08c0896SPrasad Joshi 		k++;
323e08c0896SPrasad Joshi 	}
324a33389d8SPrasad Joshi 	fprintf(stderr, "\nPlease see 'kvm run --help' for more options.\n\n");
325e08c0896SPrasad Joshi }
326e08c0896SPrasad Joshi 
32760ded003SPekka Enberg static u64 host_ram_size(void)
32860ded003SPekka Enberg {
32960ded003SPekka Enberg 	long page_size;
33060ded003SPekka Enberg 	long nr_pages;
33160ded003SPekka Enberg 
33260ded003SPekka Enberg 	nr_pages	= sysconf(_SC_PHYS_PAGES);
333d63c5ce6SPekka Enberg 	if (nr_pages < 0) {
3344542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PHYS_PAGES) failed");
335d63c5ce6SPekka Enberg 		return 0;
336d63c5ce6SPekka Enberg 	}
33760ded003SPekka Enberg 
33860ded003SPekka Enberg 	page_size	= sysconf(_SC_PAGE_SIZE);
339d63c5ce6SPekka Enberg 	if (page_size < 0) {
3404542f276SCyrill Gorcunov 		pr_warning("sysconf(_SC_PAGE_SIZE) failed");
341d63c5ce6SPekka Enberg 		return 0;
342d63c5ce6SPekka Enberg 	}
34360ded003SPekka Enberg 
34460ded003SPekka Enberg 	return (nr_pages * page_size) >> MB_SHIFT;
34560ded003SPekka Enberg }
34660ded003SPekka Enberg 
34718bd8c3bSPekka Enberg /*
34818bd8c3bSPekka Enberg  * If user didn't specify how much memory it wants to allocate for the guest,
34918bd8c3bSPekka Enberg  * avoid filling the whole host RAM.
35018bd8c3bSPekka Enberg  */
35118bd8c3bSPekka Enberg #define RAM_SIZE_RATIO		0.8
35218bd8c3bSPekka Enberg 
353fd834defSPekka Enberg static u64 get_ram_size(int nr_cpus)
354fd834defSPekka Enberg {
35506761c76SPekka Enberg 	u64 available;
35606761c76SPekka Enberg 	u64 ram_size;
357fd834defSPekka Enberg 
358fd834defSPekka Enberg 	ram_size	= 64 * (nr_cpus + 3);
359fd834defSPekka Enberg 
36060ded003SPekka Enberg 	available	= host_ram_size() * RAM_SIZE_RATIO;
361d63c5ce6SPekka Enberg 	if (!available)
362d63c5ce6SPekka Enberg 		available = MIN_RAM_SIZE_MB;
363fd834defSPekka Enberg 
364fd834defSPekka Enberg 	if (ram_size > available)
365fd834defSPekka Enberg 		ram_size	= available;
366fd834defSPekka Enberg 
367fd834defSPekka Enberg 	return ram_size;
368fd834defSPekka Enberg }
369fd834defSPekka Enberg 
370e08c0896SPrasad Joshi static const char *find_kernel(void)
371e08c0896SPrasad Joshi {
372e08c0896SPrasad Joshi 	const char **k;
3738329f30bSPekka Enberg 	struct stat st;
374e08c0896SPrasad Joshi 	struct utsname uts;
375e08c0896SPrasad Joshi 
37665182f37SPrasad Joshi 	k = &default_kernels[0];
377e08c0896SPrasad Joshi 	while (*k) {
378e08c0896SPrasad Joshi 		if (stat(*k, &st) < 0 || !S_ISREG(st.st_mode)) {
379e08c0896SPrasad Joshi 			k++;
380e08c0896SPrasad Joshi 			continue;
381e08c0896SPrasad Joshi 		}
382e08c0896SPrasad Joshi 		strncpy(kernel, *k, PATH_MAX);
383e08c0896SPrasad Joshi 		return kernel;
384e08c0896SPrasad Joshi 	}
3858329f30bSPekka Enberg 
3868329f30bSPekka Enberg 	if (uname(&uts) < 0)
3878329f30bSPekka Enberg 		return NULL;
3888329f30bSPekka Enberg 
389e08c0896SPrasad Joshi 	k = &host_kernels[0];
390e08c0896SPrasad Joshi 	while (*k) {
391e08c0896SPrasad Joshi 		if (snprintf(kernel, PATH_MAX, "%s-%s", *k, uts.release) < 0)
3928329f30bSPekka Enberg 			return NULL;
3938329f30bSPekka Enberg 
394e08c0896SPrasad Joshi 		if (stat(kernel, &st) < 0 || !S_ISREG(st.st_mode)) {
395e08c0896SPrasad Joshi 			k++;
396e08c0896SPrasad Joshi 			continue;
397e08c0896SPrasad Joshi 		}
398e08c0896SPrasad Joshi 		return kernel;
3998329f30bSPekka Enberg 
400e08c0896SPrasad Joshi 	}
4018329f30bSPekka Enberg 	return NULL;
4028329f30bSPekka Enberg }
4038329f30bSPekka Enberg 
404b0b42ba0SPekka Enberg static const char *find_vmlinux(void)
405b0b42ba0SPekka Enberg {
406b0b42ba0SPekka Enberg 	const char **vmlinux;
407b0b42ba0SPekka Enberg 
408b0b42ba0SPekka Enberg 	vmlinux = &default_vmlinux[0];
409b0b42ba0SPekka Enberg 	while (*vmlinux) {
410b0b42ba0SPekka Enberg 		struct stat st;
411b0b42ba0SPekka Enberg 
412b0b42ba0SPekka Enberg 		if (stat(*vmlinux, &st) < 0 || !S_ISREG(st.st_mode)) {
413b0b42ba0SPekka Enberg 			vmlinux++;
414b0b42ba0SPekka Enberg 			continue;
415b0b42ba0SPekka Enberg 		}
416b0b42ba0SPekka Enberg 		return *vmlinux;
417b0b42ba0SPekka Enberg 	}
418b0b42ba0SPekka Enberg 	return NULL;
419b0b42ba0SPekka Enberg }
420b0b42ba0SPekka Enberg 
/*
 * Describe the block device backing the host's root file system.
 *
 * On return *part holds the minor number of the device "/" lives on and
 * @dev holds "/dev/block/<major>:0", i.e. the node with the same major
 * number and minor 0. @dev must be large enough for that string.
 *
 * Returns 0 if that node is readable, -1 if "/" cannot be stat'ed (in
 * which case neither output is written) or the node is not readable.
 */
static int root_device(char *dev, long *part)
{
	struct stat root_st;

	if (stat("/", &root_st) < 0)
		return -1;

	*part = minor(root_st.st_dev);
	sprintf(dev, "/dev/block/%u:0", major(root_st.st_dev));

	return access(dev, R_OK) < 0 ? -1 : 0;
}
43626c853e4SPrasad Joshi 
43726c853e4SPrasad Joshi static char *host_image(char *cmd_line, size_t size)
43826c853e4SPrasad Joshi {
43926c853e4SPrasad Joshi 	char *t;
44026c853e4SPrasad Joshi 	char device[PATH_MAX];
44126c853e4SPrasad Joshi 	long part = 0;
44226c853e4SPrasad Joshi 
44326c853e4SPrasad Joshi 	t = malloc(PATH_MAX);
44426c853e4SPrasad Joshi 	if (!t)
44526c853e4SPrasad Joshi 		return NULL;
44626c853e4SPrasad Joshi 
44726c853e4SPrasad Joshi 	/* check for the root file system */
44826c853e4SPrasad Joshi 	if (root_device(device, &part) < 0) {
44926c853e4SPrasad Joshi 		free(t);
45026c853e4SPrasad Joshi 		return NULL;
45126c853e4SPrasad Joshi 	}
45226c853e4SPrasad Joshi 	strncpy(t, device, PATH_MAX);
45326c853e4SPrasad Joshi 	if (!strstr(cmd_line, "root=")) {
45426c853e4SPrasad Joshi 		char tmp[PATH_MAX];
45526c853e4SPrasad Joshi 		snprintf(tmp, sizeof(tmp), "root=/dev/vda%ld rw ", part);
45626c853e4SPrasad Joshi 		strlcat(cmd_line, tmp, size);
45726c853e4SPrasad Joshi 	}
45826c853e4SPrasad Joshi 	return t;
45926c853e4SPrasad Joshi }
46026c853e4SPrasad Joshi 
461f6677a1dSAmerigo Wang void kvm_run_help(void)
462f6677a1dSAmerigo Wang {
463f6677a1dSAmerigo Wang 	usage_with_options(run_usage, options);
464f6677a1dSAmerigo Wang }
465f6677a1dSAmerigo Wang 
466f967c427SPrasad Joshi int kvm_cmd_run(int argc, const char **argv, const char *prefix)
467f967c427SPrasad Joshi {
468b0b42ba0SPekka Enberg 	struct virtio_net_parameters net_params;
469*2d96f6b6SSasha Levin 	static char real_cmdline[2048], default_name[20];
470aba1efa5SPekka Enberg 	struct framebuffer *fb = NULL;
471384922b3SPekka Enberg 	unsigned int nr_online_cpus;
4725ee154d1SPekka Enberg 	int exit_code = 0;
473b0b42ba0SPekka Enberg 	int max_cpus;
47426c853e4SPrasad Joshi 	char *hi;
475b0b42ba0SPekka Enberg 	int i;
47649e5227dSSasha Levin 	void *ret;
477f967c427SPrasad Joshi 
4785ee154d1SPekka Enberg 	signal(SIGALRM, handle_sigalrm);
479f967c427SPrasad Joshi 	signal(SIGQUIT, handle_sigquit);
48043119af7SPekka Enberg 	signal(SIGUSR1, handle_sigusr1);
481d94e22b9SSasha Levin 	signal(SIGUSR2, handle_sigusr2);
482f967c427SPrasad Joshi 
483cfd63bbbSSasha Levin 	nr_online_cpus = sysconf(_SC_NPROCESSORS_ONLN);
484cfd63bbbSSasha Levin 
485f967c427SPrasad Joshi 	while (argc != 0) {
486f967c427SPrasad Joshi 		argc = parse_options(argc, argv, options, run_usage,
487f967c427SPrasad Joshi 				PARSE_OPT_STOP_AT_NON_OPTION);
488f967c427SPrasad Joshi 		if (argc != 0) {
489f967c427SPrasad Joshi 			if (kernel_filename) {
490f967c427SPrasad Joshi 				fprintf(stderr, "Cannot handle parameter: "
491f967c427SPrasad Joshi 						"%s\n", argv[0]);
492f967c427SPrasad Joshi 				usage_with_options(run_usage, options);
493f967c427SPrasad Joshi 				return EINVAL;
494f967c427SPrasad Joshi 			}
495f967c427SPrasad Joshi 			/* first unhandled parameter is treated as a kernel
496f967c427SPrasad Joshi 			   image
497f967c427SPrasad Joshi 			 */
498f967c427SPrasad Joshi 			kernel_filename = argv[0];
499f967c427SPrasad Joshi 			argv++;
500f967c427SPrasad Joshi 			argc--;
501f967c427SPrasad Joshi 		}
502f967c427SPrasad Joshi 
503f967c427SPrasad Joshi 	}
504f967c427SPrasad Joshi 
50545bc2f02SPekka Enberg 	if (!kernel_filename)
506e08c0896SPrasad Joshi 		kernel_filename = find_kernel();
5078329f30bSPekka Enberg 
5088329f30bSPekka Enberg 	if (!kernel_filename) {
509e08c0896SPrasad Joshi 		kernel_usage_with_options();
5108329f30bSPekka Enberg 		return EINVAL;
5118329f30bSPekka Enberg 	}
5128329f30bSPekka Enberg 
513b0b42ba0SPekka Enberg 	vmlinux_filename = find_vmlinux();
514b0b42ba0SPekka Enberg 
515cfd63bbbSSasha Levin 	if (nrcpus == 0)
516cfd63bbbSSasha Levin 		nrcpus = nr_online_cpus;
517cfd63bbbSSasha Levin 	else if (nrcpus < 1 || nrcpus > KVM_NR_CPUS)
518d77a9efaSCyrill Gorcunov 		die("Number of CPUs %d is out of [1;%d] range", nrcpus, KVM_NR_CPUS);
519d77a9efaSCyrill Gorcunov 
520fd834defSPekka Enberg 	if (!ram_size)
521fd834defSPekka Enberg 		ram_size	= get_ram_size(nrcpus);
522fd834defSPekka Enberg 
523a2a002f9SIngo Molnar 	if (ram_size < MIN_RAM_SIZE_MB)
524a2a002f9SIngo Molnar 		die("Not enough memory specified: %lluMB (min %lluMB)", ram_size, MIN_RAM_SIZE_MB);
525a2a002f9SIngo Molnar 
52660ded003SPekka Enberg 	if (ram_size > host_ram_size())
5274542f276SCyrill Gorcunov 		pr_warning("Guest memory size %lluMB exceeds host physical RAM size %lluMB", ram_size, host_ram_size());
52860ded003SPekka Enberg 
529f967c427SPrasad Joshi 	ram_size <<= MB_SHIFT;
530f967c427SPrasad Joshi 
531f967c427SPrasad Joshi 	if (!kvm_dev)
532f967c427SPrasad Joshi 		kvm_dev = DEFAULT_KVM_DEV;
533f967c427SPrasad Joshi 
5349aa4a0ebSAsias He 	if (!console)
5359aa4a0ebSAsias He 		console = DEFAULT_CONSOLE;
5369aa4a0ebSAsias He 
5379aa4a0ebSAsias He 	if (!strncmp(console, "virtio", 6))
538f967c427SPrasad Joshi 		active_console  = CONSOLE_VIRTIO;
5399aa4a0ebSAsias He 	else
5409aa4a0ebSAsias He 		active_console  = CONSOLE_8250;
541f967c427SPrasad Joshi 
5424d67c820SSasha Levin 	if (!host_ip_addr)
5434d67c820SSasha Levin 		host_ip_addr = DEFAULT_HOST_ADDR;
5444d67c820SSasha Levin 
545a4e724ddSSasha Levin 	if (!guest_mac)
546a4e724ddSSasha Levin 		guest_mac = DEFAULT_GUEST_MAC;
547a4e724ddSSasha Levin 
54873b7d038SAmos Kong 	if (!script)
54973b7d038SAmos Kong 		script = DEFAULT_SCRIPT;
55073b7d038SAmos Kong 
551b0b42ba0SPekka Enberg 	symbol__init(vmlinux_filename);
552b0b42ba0SPekka Enberg 
553f967c427SPrasad Joshi 	term_init();
554f967c427SPrasad Joshi 
555*2d96f6b6SSasha Levin 	if (!guest_name) {
556*2d96f6b6SSasha Levin 		sprintf(default_name, "guest-%u", getpid());
557*2d96f6b6SSasha Levin 		guest_name = default_name;
558*2d96f6b6SSasha Levin 	}
559*2d96f6b6SSasha Levin 
5605358b0e6SSasha Levin 	kvm = kvm__init(kvm_dev, ram_size, guest_name);
561f967c427SPrasad Joshi 
56237f3d50eSSasha Levin 	ioeventfd__init();
56337f3d50eSSasha Levin 
564384922b3SPekka Enberg 	max_cpus = kvm__max_cpus(kvm);
565384922b3SPekka Enberg 
566384922b3SPekka Enberg 	if (nrcpus > max_cpus) {
567384922b3SPekka Enberg 		printf("  # Limit the number of CPUs to %d\n", max_cpus);
568384922b3SPekka Enberg 		kvm->nrcpus	= max_cpus;
569384922b3SPekka Enberg 	}
570384922b3SPekka Enberg 
5710c7c14a7SCyrill Gorcunov 	kvm->nrcpus = nrcpus;
5720c7c14a7SCyrill Gorcunov 
573890364f8SCyrill Gorcunov 	/*
574890364f8SCyrill Gorcunov 	 * vidmode should be either specified
575890364f8SCyrill Gorcunov 	 * either set by default
576890364f8SCyrill Gorcunov 	 */
577890364f8SCyrill Gorcunov 	if (vnc || sdl) {
578890364f8SCyrill Gorcunov 		if (vidmode == -1)
579890364f8SCyrill Gorcunov 			vidmode = 0x312;
580890364f8SCyrill Gorcunov 	} else
581890364f8SCyrill Gorcunov 		vidmode = 0;
582890364f8SCyrill Gorcunov 
58326c853e4SPrasad Joshi 	memset(real_cmdline, 0, sizeof(real_cmdline));
584ea7016a9SPekka Enberg 	strcpy(real_cmdline, "notsc noapic noacpi pci=conf1 reboot=k panic=1");
5853f838fecSPekka Enberg 	if (vnc || sdl) {
5865ffd4178SJohn Floren 		strcat(real_cmdline, " video=vesafb console=tty0");
587890364f8SCyrill Gorcunov 	} else
5885ffd4178SJohn Floren 		strcat(real_cmdline, " console=ttyS0 earlyprintk=serial");
589d74181ccSSasha Levin 	strcat(real_cmdline, " ");
59026c853e4SPrasad Joshi 	if (kernel_cmdline)
59126c853e4SPrasad Joshi 		strlcat(real_cmdline, kernel_cmdline, sizeof(real_cmdline));
59226c853e4SPrasad Joshi 
59326c853e4SPrasad Joshi 	hi = NULL;
594a33979d8SSasha Levin 	if (!image_filename[0]) {
59526c853e4SPrasad Joshi 		hi = host_image(real_cmdline, sizeof(real_cmdline));
59626c853e4SPrasad Joshi 		if (hi) {
597a33979d8SSasha Levin 			image_filename[0] = hi;
598a33979d8SSasha Levin 			readonly_image[0] = true;
59925bf86f6SSasha Levin 			image_count++;
60026c853e4SPrasad Joshi 		}
60126c853e4SPrasad Joshi 	}
60226c853e4SPrasad Joshi 
60326c853e4SPrasad Joshi 	if (!strstr(real_cmdline, "root="))
60426c853e4SPrasad Joshi 		strlcat(real_cmdline, " root=/dev/vda rw ", sizeof(real_cmdline));
60526c853e4SPrasad Joshi 
606c1ed214eSPrasad Joshi 	if (image_count) {
607bcb6aacaSPrasad Joshi 		kvm->nr_disks = image_count;
608c1ed214eSPrasad Joshi 		kvm->disks    = disk_image__open_all(image_filename, readonly_image, image_count);
609c1ed214eSPrasad Joshi 		if (!kvm->disks)
610c1ed214eSPrasad Joshi 			die("Unable to load all disk images.");
61138605e1cSSasha Levin 
612bcb6aacaSPrasad Joshi 		virtio_blk__init_all(kvm);
613f967c427SPrasad Joshi 	}
614c1ed214eSPrasad Joshi 
61526c853e4SPrasad Joshi 	free(hi);
616f967c427SPrasad Joshi 
617*2d96f6b6SSasha Levin 	printf("  # kvm run -k %s -m %Lu -c %d --name %s\n", kernel_filename, ram_size / 1024 / 1024, nrcpus, guest_name);
618471c6facSPekka Enberg 
619f967c427SPrasad Joshi 	if (!kvm__load_kernel(kvm, kernel_filename, initrd_filename,
6205ffd4178SJohn Floren 				real_cmdline, vidmode))
621f967c427SPrasad Joshi 		die("unable to load kernel %s", kernel_filename);
622f967c427SPrasad Joshi 
623b0b42ba0SPekka Enberg 	kvm->vmlinux		= vmlinux_filename;
624b0b42ba0SPekka Enberg 
625ac38f433SPekka Enberg 	ioport__setup_legacy();
626ac38f433SPekka Enberg 
62764136c1cSPekka Enberg 	rtc__init();
62864136c1cSPekka Enberg 
629f967c427SPrasad Joshi 	serial8250__init(kvm);
630f967c427SPrasad Joshi 
631f967c427SPrasad Joshi 	pci__init();
632f967c427SPrasad Joshi 
6331621292eSSasha Levin 	if (active_console == CONSOLE_VIRTIO)
634f967c427SPrasad Joshi 		virtio_console__init(kvm);
635f967c427SPrasad Joshi 
63653eca082SSasha Levin 	if (virtio_rng)
63780ac1d05SSasha Levin 		while (virtio_rng--)
63853eca082SSasha Levin 			virtio_rng__init(kvm);
63953eca082SSasha Levin 
64082d2f21eSSasha Levin 	if (balloon)
64182d2f21eSSasha Levin 		virtio_bln__init(kvm);
64282d2f21eSSasha Levin 
6434f56d42cSAsias He 	if (!network)
6444f56d42cSAsias He 		network = DEFAULT_NETWORK;
6454f56d42cSAsias He 
646ec7674d7SAsias He 	if (strncmp(network, "none", 4)) {
647ec7674d7SAsias He 		net_params.host_ip = host_ip_addr;
648ec7674d7SAsias He 		net_params.kvm = kvm;
649ec7674d7SAsias He 		net_params.script = script;
650a4e724ddSSasha Levin 		sscanf(guest_mac, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
651a4e724ddSSasha Levin 			net_params.guest_mac,
652a4e724ddSSasha Levin 			net_params.guest_mac+1,
653a4e724ddSSasha Levin 			net_params.guest_mac+2,
654a4e724ddSSasha Levin 			net_params.guest_mac+3,
655a4e724ddSSasha Levin 			net_params.guest_mac+4,
656a4e724ddSSasha Levin 			net_params.guest_mac+5);
657a4e724ddSSasha Levin 
658ec7674d7SAsias He 		if (!strncmp(network, "user", 4))
659ec7674d7SAsias He 			net_params.mode = NET_MODE_USER;
660ec7674d7SAsias He 		else if (!strncmp(network, "tap", 3))
661ec7674d7SAsias He 			net_params.mode = NET_MODE_TAP;
662ec7674d7SAsias He 		else
663ec7674d7SAsias He 			die("Unkown network mode %s, please use -network user, tap, none", network);
664bdfcfca6SSasha Levin 		virtio_net__init(&net_params);
665bdfcfca6SSasha Levin 	}
6664f56d42cSAsias He 
667f967c427SPrasad Joshi 	kvm__start_timer(kvm);
668f967c427SPrasad Joshi 
6698ec7e042SSasha Levin 	kvm__setup_bios(kvm);
6708ec7e042SSasha Levin 
671d77a9efaSCyrill Gorcunov 	for (i = 0; i < nrcpus; i++) {
672d77a9efaSCyrill Gorcunov 		kvm_cpus[i] = kvm_cpu__init(kvm, i);
673d77a9efaSCyrill Gorcunov 		if (!kvm_cpus[i])
6745ee154d1SPekka Enberg 			die("unable to initialize KVM VCPU");
6755d1a249cSPekka Enberg 
6765ee154d1SPekka Enberg 		if (single_step)
677d77a9efaSCyrill Gorcunov 			kvm_cpu__enable_singlestep(kvm_cpus[i]);
678839051d9SSasha Levin 	}
6795ee154d1SPekka Enberg 
680839051d9SSasha Levin 	kvm__init_ram(kvm);
681839051d9SSasha Levin 
682714e5b7fSSasha Levin 	kbd__init(kvm);
683714e5b7fSSasha Levin 
6843f838fecSPekka Enberg 	if (vnc || sdl)
6853f838fecSPekka Enberg 		fb = vesa__init(kvm);
6863f838fecSPekka Enberg 
687e342083cSJohn Floren 	if (vnc) {
688aba1efa5SPekka Enberg 		if (fb)
689aba1efa5SPekka Enberg 			vnc__init(fb);
6903f838fecSPekka Enberg 	}
6913f838fecSPekka Enberg 
6923f838fecSPekka Enberg 	if (sdl) {
6933f838fecSPekka Enberg 		if (fb)
6943f838fecSPekka Enberg 			sdl__init(fb);
6953f838fecSPekka Enberg 	}
696aba1efa5SPekka Enberg 
697aba1efa5SPekka Enberg 	fb__start();
698aba1efa5SPekka Enberg 
699d60bafe5SSasha Levin 	thread_pool__init(nr_online_cpus);
70037f3d50eSSasha Levin 	ioeventfd__start();
701d60bafe5SSasha Levin 
702839051d9SSasha Levin 	for (i = 0; i < nrcpus; i++) {
703d77a9efaSCyrill Gorcunov 		if (pthread_create(&kvm_cpus[i]->thread, NULL, kvm_cpu_thread, kvm_cpus[i]) != 0)
7045ee154d1SPekka Enberg 			die("unable to create KVM VCPU thread");
7055ee154d1SPekka Enberg 	}
7065ee154d1SPekka Enberg 
70749e5227dSSasha Levin 	/* Only VCPU #0 is going to exit by itself when shutting down */
70849e5227dSSasha Levin 	if (pthread_join(kvm_cpus[0]->thread, &ret) != 0)
70949e5227dSSasha Levin 		exit_code = 1;
7105ee154d1SPekka Enberg 
71149e5227dSSasha Levin 	for (i = 1; i < nrcpus; i++) {
71249e5227dSSasha Levin 		pthread_kill(kvm_cpus[i]->thread, SIGKVMEXIT);
713d77a9efaSCyrill Gorcunov 		if (pthread_join(kvm_cpus[i]->thread, &ret) != 0)
7145ee154d1SPekka Enberg 			die("pthread_join");
7155ee154d1SPekka Enberg 
7165ee154d1SPekka Enberg 		if (ret != NULL)
7175ee154d1SPekka Enberg 			exit_code = 1;
7185ee154d1SPekka Enberg 	}
719f967c427SPrasad Joshi 
720aba1efa5SPekka Enberg 	fb__stop();
721aba1efa5SPekka Enberg 
722a0a1e3c2SPrasad Joshi 	virtio_blk__delete_all(kvm);
72380ac1d05SSasha Levin 	virtio_rng__delete_all(kvm);
724a0a1e3c2SPrasad Joshi 
7259df47d00SPrasad Joshi 	disk_image__close_all(kvm->disks, image_count);
726f967c427SPrasad Joshi 	kvm__delete(kvm);
727f967c427SPrasad Joshi 
7285ee154d1SPekka Enberg 	if (!exit_code)
729f967c427SPrasad Joshi 		printf("\n  # KVM session ended normally.\n");
730f967c427SPrasad Joshi 
7315ee154d1SPekka Enberg 	return exit_code;
732f967c427SPrasad Joshi }
733