xref: /kvmtool/virtio/balloon.c (revision fc835ab38f596bb9d2396a98e05d2e47e6ed235f)
182d2f21eSSasha Levin #include "kvm/virtio-balloon.h"
282d2f21eSSasha Levin 
382d2f21eSSasha Levin #include "kvm/virtio-pci-dev.h"
482d2f21eSSasha Levin 
582d2f21eSSasha Levin #include "kvm/virtio.h"
682d2f21eSSasha Levin #include "kvm/util.h"
782d2f21eSSasha Levin #include "kvm/kvm.h"
882d2f21eSSasha Levin #include "kvm/pci.h"
982d2f21eSSasha Levin #include "kvm/threadpool.h"
104b2e0a7aSSasha Levin #include "kvm/guest_compat.h"
1199c74cf9SSasha Levin #include "kvm/virtio-pci.h"
1282d2f21eSSasha Levin 
1382d2f21eSSasha Levin #include <linux/virtio_ring.h>
1482d2f21eSSasha Levin #include <linux/virtio_balloon.h>
1582d2f21eSSasha Levin 
1699c74cf9SSasha Levin #include <linux/kernel.h>
1782d2f21eSSasha Levin #include <linux/list.h>
1882d2f21eSSasha Levin #include <fcntl.h>
1982d2f21eSSasha Levin #include <sys/types.h>
2082d2f21eSSasha Levin #include <sys/stat.h>
2199c74cf9SSasha Levin #include <sys/mman.h>
2282d2f21eSSasha Levin #include <pthread.h>
231599d724SSasha Levin #include <sys/eventfd.h>
2482d2f21eSSasha Levin 
/* Number of virtqueues owned by the balloon device (sizes vqs[] and jobs[]) */
#define NUM_VIRT_QUEUES		3
/* Ring size used for every balloon virtqueue */
#define VIRTIO_BLN_QUEUE_SIZE	128
/* Indices into bln_dev.vqs[] */
#define VIRTIO_BLN_INFLATE	0
#define VIRTIO_BLN_DEFLATE	1
#define VIRTIO_BLN_STATS	2
3082d2f21eSSasha Levin 
3182d2f21eSSasha Levin struct bln_dev {
3282d2f21eSSasha Levin 	struct list_head	list;
3399c74cf9SSasha Levin 	struct virtio_pci	vpci;
3482d2f21eSSasha Levin 
3599c74cf9SSasha Levin 	u32			features;
3682d2f21eSSasha Levin 
3782d2f21eSSasha Levin 	/* virtio queue */
3882d2f21eSSasha Levin 	struct virt_queue	vqs[NUM_VIRT_QUEUES];
395cac5d9cSSasha Levin 	struct thread_pool__job	jobs[NUM_VIRT_QUEUES];
4082d2f21eSSasha Levin 
41bc10d2c1SSasha Levin 	struct virtio_balloon_stat stats[VIRTIO_BALLOON_S_NR];
42bc10d2c1SSasha Levin 	struct virtio_balloon_stat *cur_stat;
43bc10d2c1SSasha Levin 	u32			cur_stat_head;
44bc10d2c1SSasha Levin 	u16			stat_count;
45bc10d2c1SSasha Levin 	int			stat_waitfd;
46bc10d2c1SSasha Levin 
4782d2f21eSSasha Levin 	struct virtio_balloon_config config;
4882d2f21eSSasha Levin };
4982d2f21eSSasha Levin 
5082d2f21eSSasha Levin static struct bln_dev bdev;
5182d2f21eSSasha Levin extern struct kvm *kvm;
52312c62d1SSasha Levin static int compat_id = -1;
5382d2f21eSSasha Levin 
5482d2f21eSSasha Levin static bool virtio_bln_do_io_request(struct kvm *kvm, struct bln_dev *bdev, struct virt_queue *queue)
5582d2f21eSSasha Levin {
5682d2f21eSSasha Levin 	struct iovec iov[VIRTIO_BLN_QUEUE_SIZE];
5782d2f21eSSasha Levin 	unsigned int len = 0;
5882d2f21eSSasha Levin 	u16 out, in, head;
5982d2f21eSSasha Levin 	u32 *ptrs, i;
6082d2f21eSSasha Levin 
6182d2f21eSSasha Levin 	head		= virt_queue__get_iov(queue, iov, &out, &in, kvm);
6282d2f21eSSasha Levin 	ptrs		= iov[0].iov_base;
6382d2f21eSSasha Levin 	len		= iov[0].iov_len / sizeof(u32);
6482d2f21eSSasha Levin 
6582d2f21eSSasha Levin 	for (i = 0 ; i < len ; i++) {
6682d2f21eSSasha Levin 		void *guest_ptr;
6782d2f21eSSasha Levin 
6882d2f21eSSasha Levin 		guest_ptr = guest_flat_to_host(kvm, ptrs[i] << VIRTIO_BALLOON_PFN_SHIFT);
6982d2f21eSSasha Levin 		if (queue == &bdev->vqs[VIRTIO_BLN_INFLATE]) {
7082d2f21eSSasha Levin 			madvise(guest_ptr, 1 << VIRTIO_BALLOON_PFN_SHIFT, MADV_DONTNEED);
7182d2f21eSSasha Levin 			bdev->config.actual++;
72bc10d2c1SSasha Levin 		} else if (queue == &bdev->vqs[VIRTIO_BLN_DEFLATE]) {
7382d2f21eSSasha Levin 			bdev->config.actual--;
7482d2f21eSSasha Levin 		}
7582d2f21eSSasha Levin 	}
7682d2f21eSSasha Levin 
7782d2f21eSSasha Levin 	virt_queue__set_used_elem(queue, head, len);
7882d2f21eSSasha Levin 
7982d2f21eSSasha Levin 	return true;
8082d2f21eSSasha Levin }
8182d2f21eSSasha Levin 
82bc10d2c1SSasha Levin static bool virtio_bln_do_stat_request(struct kvm *kvm, struct bln_dev *bdev, struct virt_queue *queue)
83bc10d2c1SSasha Levin {
84bc10d2c1SSasha Levin 	struct iovec iov[VIRTIO_BLN_QUEUE_SIZE];
85bc10d2c1SSasha Levin 	u16 out, in, head;
86bc10d2c1SSasha Levin 	struct virtio_balloon_stat *stat;
87bc10d2c1SSasha Levin 	u64 wait_val = 1;
88bc10d2c1SSasha Levin 
89bc10d2c1SSasha Levin 	head = virt_queue__get_iov(queue, iov, &out, &in, kvm);
90bc10d2c1SSasha Levin 	stat = iov[0].iov_base;
91bc10d2c1SSasha Levin 
92bc10d2c1SSasha Levin 	/* Initial empty stat buffer */
93bc10d2c1SSasha Levin 	if (bdev->cur_stat == NULL) {
94bc10d2c1SSasha Levin 		bdev->cur_stat = stat;
95bc10d2c1SSasha Levin 		bdev->cur_stat_head = head;
96bc10d2c1SSasha Levin 
97bc10d2c1SSasha Levin 		return true;
98bc10d2c1SSasha Levin 	}
99bc10d2c1SSasha Levin 
100bc10d2c1SSasha Levin 	memcpy(bdev->stats, stat, iov[0].iov_len);
101bc10d2c1SSasha Levin 
102bc10d2c1SSasha Levin 	bdev->stat_count = iov[0].iov_len / sizeof(struct virtio_balloon_stat);
103bc10d2c1SSasha Levin 	bdev->cur_stat = stat;
104bc10d2c1SSasha Levin 	bdev->cur_stat_head = head;
105bc10d2c1SSasha Levin 
106bc10d2c1SSasha Levin 	if (write(bdev->stat_waitfd, &wait_val, sizeof(wait_val)) <= 0)
107bc10d2c1SSasha Levin 		return -EFAULT;
108bc10d2c1SSasha Levin 
109bc10d2c1SSasha Levin 	return 1;
110bc10d2c1SSasha Levin }
111bc10d2c1SSasha Levin 
11282d2f21eSSasha Levin static void virtio_bln_do_io(struct kvm *kvm, void *param)
11382d2f21eSSasha Levin {
11482d2f21eSSasha Levin 	struct virt_queue *vq = param;
11582d2f21eSSasha Levin 
116bc10d2c1SSasha Levin 	if (vq == &bdev.vqs[VIRTIO_BLN_STATS]) {
117bc10d2c1SSasha Levin 		virtio_bln_do_stat_request(kvm, &bdev, vq);
11899c74cf9SSasha Levin 		virtio_pci__signal_vq(kvm, &bdev.vpci, VIRTIO_BLN_STATS);
119bc10d2c1SSasha Levin 		return;
120bc10d2c1SSasha Levin 	}
121bc10d2c1SSasha Levin 
12282d2f21eSSasha Levin 	while (virt_queue__available(vq)) {
12382d2f21eSSasha Levin 		virtio_bln_do_io_request(kvm, &bdev, vq);
12499c74cf9SSasha Levin 		virtio_pci__signal_vq(kvm, &bdev.vpci, vq - bdev.vqs);
12582d2f21eSSasha Levin 	}
12682d2f21eSSasha Levin }
12782d2f21eSSasha Levin 
128bc10d2c1SSasha Levin static int virtio_bln__collect_stats(void)
129bc10d2c1SSasha Levin {
130bc10d2c1SSasha Levin 	u64 tmp;
131bc10d2c1SSasha Levin 
132bc10d2c1SSasha Levin 	virt_queue__set_used_elem(&bdev.vqs[VIRTIO_BLN_STATS], bdev.cur_stat_head,
133bc10d2c1SSasha Levin 				  sizeof(struct virtio_balloon_stat));
13499c74cf9SSasha Levin 	virtio_pci__signal_vq(kvm, &bdev.vpci, VIRTIO_BLN_STATS);
135bc10d2c1SSasha Levin 
136bc10d2c1SSasha Levin 	if (read(bdev.stat_waitfd, &tmp, sizeof(tmp)) <= 0)
137bc10d2c1SSasha Levin 		return -EFAULT;
138bc10d2c1SSasha Levin 
139bc10d2c1SSasha Levin 	return 0;
140bc10d2c1SSasha Levin }
141bc10d2c1SSasha Levin 
142bc10d2c1SSasha Levin static int virtio_bln__print_stats(void)
143bc10d2c1SSasha Levin {
144bc10d2c1SSasha Levin 	u16 i;
145bc10d2c1SSasha Levin 
146bc10d2c1SSasha Levin 	if (virtio_bln__collect_stats() < 0)
147bc10d2c1SSasha Levin 		return -EFAULT;
148bc10d2c1SSasha Levin 
149bc10d2c1SSasha Levin 	printf("\n\n\t*** Guest memory statistics ***\n\n");
150bc10d2c1SSasha Levin 	for (i = 0; i < bdev.stat_count; i++) {
151bc10d2c1SSasha Levin 		switch (bdev.stats[i].tag) {
152bc10d2c1SSasha Levin 		case VIRTIO_BALLOON_S_SWAP_IN:
153bc10d2c1SSasha Levin 			printf("The amount of memory that has been swapped in (in bytes):");
154bc10d2c1SSasha Levin 			break;
155bc10d2c1SSasha Levin 		case VIRTIO_BALLOON_S_SWAP_OUT:
156bc10d2c1SSasha Levin 			printf("The amount of memory that has been swapped out to disk (in bytes):");
157bc10d2c1SSasha Levin 			break;
158bc10d2c1SSasha Levin 		case VIRTIO_BALLOON_S_MAJFLT:
159bc10d2c1SSasha Levin 			printf("The number of major page faults that have occurred:");
160bc10d2c1SSasha Levin 			break;
161bc10d2c1SSasha Levin 		case VIRTIO_BALLOON_S_MINFLT:
162bc10d2c1SSasha Levin 			printf("The number of minor page faults that have occurred:");
163bc10d2c1SSasha Levin 			break;
164bc10d2c1SSasha Levin 		case VIRTIO_BALLOON_S_MEMFREE:
165bc10d2c1SSasha Levin 			printf("The amount of memory not being used for any purpose (in bytes):");
166bc10d2c1SSasha Levin 			break;
167bc10d2c1SSasha Levin 		case VIRTIO_BALLOON_S_MEMTOT:
168bc10d2c1SSasha Levin 			printf("The total amount of memory available (in bytes):");
169bc10d2c1SSasha Levin 			break;
170bc10d2c1SSasha Levin 		}
171bc10d2c1SSasha Levin 		printf("%llu\n", bdev.stats[i].val);
172bc10d2c1SSasha Levin 	}
173bc10d2c1SSasha Levin 	printf("\n");
174bc10d2c1SSasha Levin 
175bc10d2c1SSasha Levin 	return 0;
176bc10d2c1SSasha Levin }
177bc10d2c1SSasha Levin 
17882d2f21eSSasha Levin static void handle_sigmem(int sig)
17982d2f21eSSasha Levin {
18042bcd3eeSLiming Wang 	if (sig == SIGKVMADDMEM) {
18182d2f21eSSasha Levin 		bdev.config.num_pages += 256;
182bc10d2c1SSasha Levin 	} else if (sig == SIGKVMDELMEM) {
18342bcd3eeSLiming Wang 		if (bdev.config.num_pages < 256)
18442bcd3eeSLiming Wang 			return;
18542bcd3eeSLiming Wang 
18682d2f21eSSasha Levin 		bdev.config.num_pages -= 256;
187bc10d2c1SSasha Levin 	} else if (sig == SIGKVMMEMSTAT) {
188bc10d2c1SSasha Levin 		virtio_bln__print_stats();
189bc10d2c1SSasha Levin 
190bc10d2c1SSasha Levin 		return;
19142bcd3eeSLiming Wang 	}
19282d2f21eSSasha Levin 
19382d2f21eSSasha Levin 	/* Notify that the configuration space has changed */
19499c74cf9SSasha Levin 	virtio_pci__signal_config(kvm, &bdev.vpci);
19599c74cf9SSasha Levin }
19699c74cf9SSasha Levin 
19799c74cf9SSasha Levin static void set_config(struct kvm *kvm, void *dev, u8 data, u32 offset)
19899c74cf9SSasha Levin {
19999c74cf9SSasha Levin 	struct bln_dev *bdev = dev;
20099c74cf9SSasha Levin 
20199c74cf9SSasha Levin 	((u8 *)(&bdev->config))[offset] = data;
20299c74cf9SSasha Levin }
20399c74cf9SSasha Levin 
20499c74cf9SSasha Levin static u8 get_config(struct kvm *kvm, void *dev, u32 offset)
20599c74cf9SSasha Levin {
20699c74cf9SSasha Levin 	struct bln_dev *bdev = dev;
20799c74cf9SSasha Levin 
20899c74cf9SSasha Levin 	return ((u8 *)(&bdev->config))[offset];
20999c74cf9SSasha Levin }
21099c74cf9SSasha Levin 
21199c74cf9SSasha Levin static u32 get_host_features(struct kvm *kvm, void *dev)
21299c74cf9SSasha Levin {
21399c74cf9SSasha Levin 	return 1 << VIRTIO_BALLOON_F_STATS_VQ;
21499c74cf9SSasha Levin }
21599c74cf9SSasha Levin 
21699c74cf9SSasha Levin static void set_guest_features(struct kvm *kvm, void *dev, u32 features)
21799c74cf9SSasha Levin {
21899c74cf9SSasha Levin 	struct bln_dev *bdev = dev;
21999c74cf9SSasha Levin 
22099c74cf9SSasha Levin 	bdev->features = features;
22199c74cf9SSasha Levin }
22299c74cf9SSasha Levin 
22399c74cf9SSasha Levin static int init_vq(struct kvm *kvm, void *dev, u32 vq, u32 pfn)
22499c74cf9SSasha Levin {
22599c74cf9SSasha Levin 	struct bln_dev *bdev = dev;
22699c74cf9SSasha Levin 	struct virt_queue *queue;
22799c74cf9SSasha Levin 	void *p;
22899c74cf9SSasha Levin 
229312c62d1SSasha Levin 	compat__remove_message(compat_id);
23099c74cf9SSasha Levin 
23199c74cf9SSasha Levin 	queue			= &bdev->vqs[vq];
23299c74cf9SSasha Levin 	queue->pfn		= pfn;
23399c74cf9SSasha Levin 	p			= guest_pfn_to_host(kvm, queue->pfn);
23499c74cf9SSasha Levin 
23599c74cf9SSasha Levin 	thread_pool__init_job(&bdev->jobs[vq], kvm, virtio_bln_do_io, queue);
23699c74cf9SSasha Levin 	vring_init(&queue->vring, VIRTIO_BLN_QUEUE_SIZE, p, VIRTIO_PCI_VRING_ALIGN);
23799c74cf9SSasha Levin 
23899c74cf9SSasha Levin 	return 0;
23999c74cf9SSasha Levin }
24099c74cf9SSasha Levin 
24199c74cf9SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq)
24299c74cf9SSasha Levin {
24399c74cf9SSasha Levin 	struct bln_dev *bdev = dev;
24499c74cf9SSasha Levin 
24599c74cf9SSasha Levin 	thread_pool__do_job(&bdev->jobs[vq]);
24699c74cf9SSasha Levin 
24799c74cf9SSasha Levin 	return 0;
24899c74cf9SSasha Levin }
24999c74cf9SSasha Levin 
25099c74cf9SSasha Levin static int get_pfn_vq(struct kvm *kvm, void *dev, u32 vq)
25199c74cf9SSasha Levin {
25299c74cf9SSasha Levin 	struct bln_dev *bdev = dev;
25399c74cf9SSasha Levin 
25499c74cf9SSasha Levin 	return bdev->vqs[vq].pfn;
25599c74cf9SSasha Levin }
25699c74cf9SSasha Levin 
25799c74cf9SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq)
25899c74cf9SSasha Levin {
25999c74cf9SSasha Levin 	return VIRTIO_BLN_QUEUE_SIZE;
26082d2f21eSSasha Levin }
26182d2f21eSSasha Levin 
26282d2f21eSSasha Levin void virtio_bln__init(struct kvm *kvm)
26382d2f21eSSasha Levin {
26482d2f21eSSasha Levin 	signal(SIGKVMADDMEM, handle_sigmem);
26582d2f21eSSasha Levin 	signal(SIGKVMDELMEM, handle_sigmem);
266bc10d2c1SSasha Levin 	signal(SIGKVMMEMSTAT, handle_sigmem);
26782d2f21eSSasha Levin 
268bc10d2c1SSasha Levin 	bdev.stat_waitfd	= eventfd(0, 0);
26982d2f21eSSasha Levin 	memset(&bdev.config, 0, sizeof(struct virtio_balloon_config));
27082d2f21eSSasha Levin 
27199c74cf9SSasha Levin 	virtio_pci__init(kvm, &bdev.vpci, &bdev, PCI_DEVICE_ID_VIRTIO_BLN, VIRTIO_ID_BALLOON);
27299c74cf9SSasha Levin 	bdev.vpci.ops = (struct virtio_pci_ops) {
27399c74cf9SSasha Levin 		.set_config		= set_config,
27499c74cf9SSasha Levin 		.get_config		= get_config,
27599c74cf9SSasha Levin 		.get_host_features	= get_host_features,
27699c74cf9SSasha Levin 		.set_guest_features	= set_guest_features,
27799c74cf9SSasha Levin 		.init_vq		= init_vq,
27899c74cf9SSasha Levin 		.notify_vq		= notify_vq,
27999c74cf9SSasha Levin 		.get_pfn_vq		= get_pfn_vq,
28099c74cf9SSasha Levin 		.get_size_vq		= get_size_vq,
28199c74cf9SSasha Levin 	};
2824b2e0a7aSSasha Levin 
283312c62d1SSasha Levin 	if (compat_id != -1)
284312c62d1SSasha Levin 		compat_id = compat__add_message("virtio-balloon device was not detected",
2854b2e0a7aSSasha Levin 						"While you have requested a virtio-balloon device, "
286*fc835ab3SSasha Levin 						"the guest kernel did not initialize it.\n"
287*fc835ab3SSasha Levin 						"Please make sure that the guest kernel was "
288*fc835ab3SSasha Levin 						"compiled with CONFIG_VIRTIO_BALLOON=y enabled "
289*fc835ab3SSasha Levin 						"in its .config");
29082d2f21eSSasha Levin }
291