182d2f21eSSasha Levin #include "kvm/virtio-balloon.h" 282d2f21eSSasha Levin 382d2f21eSSasha Levin #include "kvm/virtio-pci-dev.h" 482d2f21eSSasha Levin 582d2f21eSSasha Levin #include "kvm/virtio.h" 682d2f21eSSasha Levin #include "kvm/util.h" 782d2f21eSSasha Levin #include "kvm/kvm.h" 882d2f21eSSasha Levin #include "kvm/pci.h" 982d2f21eSSasha Levin #include "kvm/threadpool.h" 104b2e0a7aSSasha Levin #include "kvm/guest_compat.h" 1199c74cf9SSasha Levin #include "kvm/virtio-pci.h" 1282d2f21eSSasha Levin 1382d2f21eSSasha Levin #include <linux/virtio_ring.h> 1482d2f21eSSasha Levin #include <linux/virtio_balloon.h> 1582d2f21eSSasha Levin 1699c74cf9SSasha Levin #include <linux/kernel.h> 1782d2f21eSSasha Levin #include <linux/list.h> 1882d2f21eSSasha Levin #include <fcntl.h> 1982d2f21eSSasha Levin #include <sys/types.h> 2082d2f21eSSasha Levin #include <sys/stat.h> 2199c74cf9SSasha Levin #include <sys/mman.h> 2282d2f21eSSasha Levin #include <pthread.h> 231599d724SSasha Levin #include <sys/eventfd.h> 2482d2f21eSSasha Levin 25bc10d2c1SSasha Levin #define NUM_VIRT_QUEUES 3 2682d2f21eSSasha Levin #define VIRTIO_BLN_QUEUE_SIZE 128 2782d2f21eSSasha Levin #define VIRTIO_BLN_INFLATE 0 2882d2f21eSSasha Levin #define VIRTIO_BLN_DEFLATE 1 29bc10d2c1SSasha Levin #define VIRTIO_BLN_STATS 2 3082d2f21eSSasha Levin 3182d2f21eSSasha Levin struct bln_dev { 3282d2f21eSSasha Levin struct list_head list; 3399c74cf9SSasha Levin struct virtio_pci vpci; 3482d2f21eSSasha Levin 3599c74cf9SSasha Levin u32 features; 3682d2f21eSSasha Levin 3782d2f21eSSasha Levin /* virtio queue */ 3882d2f21eSSasha Levin struct virt_queue vqs[NUM_VIRT_QUEUES]; 395cac5d9cSSasha Levin struct thread_pool__job jobs[NUM_VIRT_QUEUES]; 4082d2f21eSSasha Levin 41bc10d2c1SSasha Levin struct virtio_balloon_stat stats[VIRTIO_BALLOON_S_NR]; 42bc10d2c1SSasha Levin struct virtio_balloon_stat *cur_stat; 43bc10d2c1SSasha Levin u32 cur_stat_head; 44bc10d2c1SSasha Levin u16 stat_count; 45bc10d2c1SSasha Levin int stat_waitfd; 46bc10d2c1SSasha Levin 4782d2f21eSSasha Levin struct virtio_balloon_config config; 4882d2f21eSSasha Levin }; 4982d2f21eSSasha Levin 5082d2f21eSSasha Levin static struct bln_dev bdev; 5182d2f21eSSasha Levin extern struct kvm *kvm; 52312c62d1SSasha Levin static int compat_id = -1; 5382d2f21eSSasha Levin 5482d2f21eSSasha Levin static bool virtio_bln_do_io_request(struct kvm *kvm, struct bln_dev *bdev, struct virt_queue *queue) 5582d2f21eSSasha Levin { 5682d2f21eSSasha Levin struct iovec iov[VIRTIO_BLN_QUEUE_SIZE]; 5782d2f21eSSasha Levin unsigned int len = 0; 5882d2f21eSSasha Levin u16 out, in, head; 5982d2f21eSSasha Levin u32 *ptrs, i; 6082d2f21eSSasha Levin 6182d2f21eSSasha Levin head = virt_queue__get_iov(queue, iov, &out, &in, kvm); 6282d2f21eSSasha Levin ptrs = iov[0].iov_base; 6382d2f21eSSasha Levin len = iov[0].iov_len / sizeof(u32); 6482d2f21eSSasha Levin 6582d2f21eSSasha Levin for (i = 0 ; i < len ; i++) { 6682d2f21eSSasha Levin void *guest_ptr; 6782d2f21eSSasha Levin 6882d2f21eSSasha Levin guest_ptr = guest_flat_to_host(kvm, ptrs[i] << VIRTIO_BALLOON_PFN_SHIFT); 6982d2f21eSSasha Levin if (queue == &bdev->vqs[VIRTIO_BLN_INFLATE]) { 7082d2f21eSSasha Levin madvise(guest_ptr, 1 << VIRTIO_BALLOON_PFN_SHIFT, MADV_DONTNEED); 7182d2f21eSSasha Levin bdev->config.actual++; 72bc10d2c1SSasha Levin } else if (queue == &bdev->vqs[VIRTIO_BLN_DEFLATE]) { 7382d2f21eSSasha Levin bdev->config.actual--; 7482d2f21eSSasha Levin } 7582d2f21eSSasha Levin } 7682d2f21eSSasha Levin 7782d2f21eSSasha Levin virt_queue__set_used_elem(queue, head, len); 7882d2f21eSSasha Levin 7982d2f21eSSasha Levin return true; 8082d2f21eSSasha Levin } 8182d2f21eSSasha Levin 82bc10d2c1SSasha Levin static bool virtio_bln_do_stat_request(struct kvm *kvm, struct bln_dev *bdev, struct virt_queue *queue) 83bc10d2c1SSasha Levin { 84bc10d2c1SSasha Levin struct iovec iov[VIRTIO_BLN_QUEUE_SIZE]; 85bc10d2c1SSasha Levin u16 out, in, head; 86bc10d2c1SSasha Levin struct virtio_balloon_stat *stat; 87bc10d2c1SSasha Levin u64 wait_val = 1; 88bc10d2c1SSasha Levin 89bc10d2c1SSasha Levin head = virt_queue__get_iov(queue, iov, &out, &in, kvm); 90bc10d2c1SSasha Levin stat = iov[0].iov_base; 91bc10d2c1SSasha Levin 92bc10d2c1SSasha Levin /* Initial empty stat buffer */ 93bc10d2c1SSasha Levin if (bdev->cur_stat == NULL) { 94bc10d2c1SSasha Levin bdev->cur_stat = stat; 95bc10d2c1SSasha Levin bdev->cur_stat_head = head; 96bc10d2c1SSasha Levin 97bc10d2c1SSasha Levin return true; 98bc10d2c1SSasha Levin } 99bc10d2c1SSasha Levin 100bc10d2c1SSasha Levin memcpy(bdev->stats, stat, iov[0].iov_len); 101bc10d2c1SSasha Levin 102bc10d2c1SSasha Levin bdev->stat_count = iov[0].iov_len / sizeof(struct virtio_balloon_stat); 103bc10d2c1SSasha Levin bdev->cur_stat = stat; 104bc10d2c1SSasha Levin bdev->cur_stat_head = head; 105bc10d2c1SSasha Levin 106bc10d2c1SSasha Levin if (write(bdev->stat_waitfd, &wait_val, sizeof(wait_val)) <= 0) 107bc10d2c1SSasha Levin return -EFAULT; 108bc10d2c1SSasha Levin 109bc10d2c1SSasha Levin return 1; 110bc10d2c1SSasha Levin } 111bc10d2c1SSasha Levin 11282d2f21eSSasha Levin static void virtio_bln_do_io(struct kvm *kvm, void *param) 11382d2f21eSSasha Levin { 11482d2f21eSSasha Levin struct virt_queue *vq = param; 11582d2f21eSSasha Levin 116bc10d2c1SSasha Levin if (vq == &bdev.vqs[VIRTIO_BLN_STATS]) { 117bc10d2c1SSasha Levin virtio_bln_do_stat_request(kvm, &bdev, vq); 11899c74cf9SSasha Levin virtio_pci__signal_vq(kvm, &bdev.vpci, VIRTIO_BLN_STATS); 119bc10d2c1SSasha Levin return; 120bc10d2c1SSasha Levin } 121bc10d2c1SSasha Levin 12282d2f21eSSasha Levin while (virt_queue__available(vq)) { 12382d2f21eSSasha Levin virtio_bln_do_io_request(kvm, &bdev, vq); 12499c74cf9SSasha Levin virtio_pci__signal_vq(kvm, &bdev.vpci, vq - bdev.vqs); 12582d2f21eSSasha Levin } 12682d2f21eSSasha Levin } 12782d2f21eSSasha Levin 128bc10d2c1SSasha Levin static int virtio_bln__collect_stats(void) 129bc10d2c1SSasha Levin { 130bc10d2c1SSasha Levin u64 tmp; 131bc10d2c1SSasha Levin 132bc10d2c1SSasha Levin virt_queue__set_used_elem(&bdev.vqs[VIRTIO_BLN_STATS], bdev.cur_stat_head, 133bc10d2c1SSasha Levin sizeof(struct virtio_balloon_stat)); 13499c74cf9SSasha Levin virtio_pci__signal_vq(kvm, &bdev.vpci, VIRTIO_BLN_STATS); 135bc10d2c1SSasha Levin 136bc10d2c1SSasha Levin if (read(bdev.stat_waitfd, &tmp, sizeof(tmp)) <= 0) 137bc10d2c1SSasha Levin return -EFAULT; 138bc10d2c1SSasha Levin 139bc10d2c1SSasha Levin return 0; 140bc10d2c1SSasha Levin } 141bc10d2c1SSasha Levin 142bc10d2c1SSasha Levin static int virtio_bln__print_stats(void) 143bc10d2c1SSasha Levin { 144bc10d2c1SSasha Levin u16 i; 145bc10d2c1SSasha Levin 146bc10d2c1SSasha Levin if (virtio_bln__collect_stats() < 0) 147bc10d2c1SSasha Levin return -EFAULT; 148bc10d2c1SSasha Levin 149bc10d2c1SSasha Levin printf("\n\n\t*** Guest memory statistics ***\n\n"); 150bc10d2c1SSasha Levin for (i = 0; i < bdev.stat_count; i++) { 151bc10d2c1SSasha Levin switch (bdev.stats[i].tag) { 152bc10d2c1SSasha Levin case VIRTIO_BALLOON_S_SWAP_IN: 153bc10d2c1SSasha Levin printf("The amount of memory that has been swapped in (in bytes):"); 154bc10d2c1SSasha Levin break; 155bc10d2c1SSasha Levin case VIRTIO_BALLOON_S_SWAP_OUT: 156bc10d2c1SSasha Levin printf("The amount of memory that has been swapped out to disk (in bytes):"); 157bc10d2c1SSasha Levin break; 158bc10d2c1SSasha Levin case VIRTIO_BALLOON_S_MAJFLT: 159bc10d2c1SSasha Levin printf("The number of major page faults that have occurred:"); 160bc10d2c1SSasha Levin break; 161bc10d2c1SSasha Levin case VIRTIO_BALLOON_S_MINFLT: 162bc10d2c1SSasha Levin printf("The number of minor page faults that have occurred:"); 163bc10d2c1SSasha Levin break; 164bc10d2c1SSasha Levin case VIRTIO_BALLOON_S_MEMFREE: 165bc10d2c1SSasha Levin printf("The amount of memory not being used for any purpose (in bytes):"); 166bc10d2c1SSasha Levin break; 167bc10d2c1SSasha Levin case VIRTIO_BALLOON_S_MEMTOT: 168bc10d2c1SSasha Levin printf("The total amount of memory available (in bytes):"); 169bc10d2c1SSasha Levin break; 170bc10d2c1SSasha Levin } 171bc10d2c1SSasha Levin printf("%llu\n", bdev.stats[i].val); 172bc10d2c1SSasha Levin } 173bc10d2c1SSasha Levin printf("\n"); 174bc10d2c1SSasha Levin 175bc10d2c1SSasha Levin return 0; 176bc10d2c1SSasha Levin } 177bc10d2c1SSasha Levin 17882d2f21eSSasha Levin static void handle_sigmem(int sig) 17982d2f21eSSasha Levin { 18042bcd3eeSLiming Wang if (sig == SIGKVMADDMEM) { 18182d2f21eSSasha Levin bdev.config.num_pages += 256; 182bc10d2c1SSasha Levin } else if (sig == SIGKVMDELMEM) { 18342bcd3eeSLiming Wang if (bdev.config.num_pages < 256) 18442bcd3eeSLiming Wang return; 18542bcd3eeSLiming Wang 18682d2f21eSSasha Levin bdev.config.num_pages -= 256; 187bc10d2c1SSasha Levin } else if (sig == SIGKVMMEMSTAT) { 188bc10d2c1SSasha Levin virtio_bln__print_stats(); 189bc10d2c1SSasha Levin 190bc10d2c1SSasha Levin return; 19142bcd3eeSLiming Wang } 19282d2f21eSSasha Levin 19382d2f21eSSasha Levin /* Notify that the configuration space has changed */ 19499c74cf9SSasha Levin virtio_pci__signal_config(kvm, &bdev.vpci); 19599c74cf9SSasha Levin } 19699c74cf9SSasha Levin 19799c74cf9SSasha Levin static void set_config(struct kvm *kvm, void *dev, u8 data, u32 offset) 19899c74cf9SSasha Levin { 19999c74cf9SSasha Levin struct bln_dev *bdev = dev; 20099c74cf9SSasha Levin 20199c74cf9SSasha Levin ((u8 *)(&bdev->config))[offset] = data; 20299c74cf9SSasha Levin } 20399c74cf9SSasha Levin 20499c74cf9SSasha Levin static u8 get_config(struct kvm *kvm, void *dev, u32 offset) 20599c74cf9SSasha Levin { 20699c74cf9SSasha Levin struct bln_dev *bdev = dev; 20799c74cf9SSasha Levin 20899c74cf9SSasha Levin return ((u8 *)(&bdev->config))[offset]; 20999c74cf9SSasha Levin } 21099c74cf9SSasha Levin 21199c74cf9SSasha Levin static u32 get_host_features(struct kvm *kvm, void *dev) 21299c74cf9SSasha Levin { 21399c74cf9SSasha Levin return 1 << VIRTIO_BALLOON_F_STATS_VQ; 21499c74cf9SSasha Levin } 21599c74cf9SSasha Levin 21699c74cf9SSasha Levin static void set_guest_features(struct kvm *kvm, void *dev, u32 features) 21799c74cf9SSasha Levin { 21899c74cf9SSasha Levin struct bln_dev *bdev = dev; 21999c74cf9SSasha Levin 22099c74cf9SSasha Levin bdev->features = features; 22199c74cf9SSasha Levin } 22299c74cf9SSasha Levin 22399c74cf9SSasha Levin static int init_vq(struct kvm *kvm, void *dev, u32 vq, u32 pfn) 22499c74cf9SSasha Levin { 22599c74cf9SSasha Levin struct bln_dev *bdev = dev; 22699c74cf9SSasha Levin struct virt_queue *queue; 22799c74cf9SSasha Levin void *p; 22899c74cf9SSasha Levin 229312c62d1SSasha Levin compat__remove_message(compat_id); 23099c74cf9SSasha Levin 23199c74cf9SSasha Levin queue = &bdev->vqs[vq]; 23299c74cf9SSasha Levin queue->pfn = pfn; 23399c74cf9SSasha Levin p = guest_pfn_to_host(kvm, queue->pfn); 23499c74cf9SSasha Levin 23599c74cf9SSasha Levin thread_pool__init_job(&bdev->jobs[vq], kvm, virtio_bln_do_io, queue); 23699c74cf9SSasha Levin vring_init(&queue->vring, VIRTIO_BLN_QUEUE_SIZE, p, VIRTIO_PCI_VRING_ALIGN); 23799c74cf9SSasha Levin 23899c74cf9SSasha Levin return 0; 23999c74cf9SSasha Levin } 24099c74cf9SSasha Levin 24199c74cf9SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq) 24299c74cf9SSasha Levin { 24399c74cf9SSasha Levin struct bln_dev *bdev = dev; 24499c74cf9SSasha Levin 24599c74cf9SSasha Levin thread_pool__do_job(&bdev->jobs[vq]); 24699c74cf9SSasha Levin 24799c74cf9SSasha Levin return 0; 24899c74cf9SSasha Levin } 24999c74cf9SSasha Levin 25099c74cf9SSasha Levin static int get_pfn_vq(struct kvm *kvm, void *dev, u32 vq) 25199c74cf9SSasha Levin { 25299c74cf9SSasha Levin struct bln_dev *bdev = dev; 25399c74cf9SSasha Levin 25499c74cf9SSasha Levin return bdev->vqs[vq].pfn; 25599c74cf9SSasha Levin } 25699c74cf9SSasha Levin 25799c74cf9SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq) 25899c74cf9SSasha Levin { 25999c74cf9SSasha Levin return VIRTIO_BLN_QUEUE_SIZE; 26082d2f21eSSasha Levin } 26182d2f21eSSasha Levin 26282d2f21eSSasha Levin void virtio_bln__init(struct kvm *kvm) 26382d2f21eSSasha Levin { 26482d2f21eSSasha Levin signal(SIGKVMADDMEM, handle_sigmem); 26582d2f21eSSasha Levin signal(SIGKVMDELMEM, handle_sigmem); 266bc10d2c1SSasha Levin signal(SIGKVMMEMSTAT, handle_sigmem); 26782d2f21eSSasha Levin 268bc10d2c1SSasha Levin bdev.stat_waitfd = eventfd(0, 0); 26982d2f21eSSasha Levin memset(&bdev.config, 0, sizeof(struct virtio_balloon_config)); 27082d2f21eSSasha Levin 27199c74cf9SSasha Levin virtio_pci__init(kvm, &bdev.vpci, &bdev, PCI_DEVICE_ID_VIRTIO_BLN, VIRTIO_ID_BALLOON); 27299c74cf9SSasha Levin bdev.vpci.ops = (struct virtio_pci_ops) { 27399c74cf9SSasha Levin .set_config = set_config, 27499c74cf9SSasha Levin .get_config = get_config, 27599c74cf9SSasha Levin .get_host_features = get_host_features, 27699c74cf9SSasha Levin .set_guest_features = set_guest_features, 27799c74cf9SSasha Levin .init_vq = init_vq, 27899c74cf9SSasha Levin .notify_vq = notify_vq, 27999c74cf9SSasha Levin .get_pfn_vq = get_pfn_vq, 28099c74cf9SSasha Levin .get_size_vq = get_size_vq, 28199c74cf9SSasha Levin }; 2824b2e0a7aSSasha Levin 283312c62d1SSasha Levin if (compat_id != -1) 284312c62d1SSasha Levin compat_id = compat__add_message("virtio-balloon device was not detected", 2854b2e0a7aSSasha Levin "While you have requested a virtio-balloon device, " 286*fc835ab3SSasha Levin "the guest kernel did not initialize it.\n" 287*fc835ab3SSasha Levin "Please make sure that the guest kernel was " 288*fc835ab3SSasha Levin "compiled with CONFIG_VIRTIO_BALLOON=y enabled " 289*fc835ab3SSasha Levin "in its .config"); 29082d2f21eSSasha Levin } 291