1416b2c2dSAsias He #include "kvm/virtio-blk.h" 2b30d05adSPekka Enberg 331638bcaSCyrill Gorcunov #include "kvm/virtio-pci-dev.h" 45a24a9f2SPekka Enberg #include "kvm/disk-image.h" 54ef0f4d6SPekka Enberg #include "kvm/mutex.h" 6fe99fd4eSPekka Enberg #include "kvm/util.h" 78b1ff07eSPekka Enberg #include "kvm/kvm.h" 8b30d05adSPekka Enberg #include "kvm/pci.h" 9fb0957f2SSasha Levin #include "kvm/threadpool.h" 10ec75b82fSSasha Levin #include "kvm/ioeventfd.h" 11404d164bSSasha Levin #include "kvm/guest_compat.h" 12427948d5SSasha Levin #include "kvm/virtio-pci.h" 13*f41a132bSSasha Levin #include "kvm/virtio.h" 14b30d05adSPekka Enberg 1520c64ecaSPekka Enberg #include <linux/virtio_ring.h> 1620c64ecaSPekka Enberg #include <linux/virtio_blk.h> 17427948d5SSasha Levin #include <linux/kernel.h> 18ebe9ac19SSasha Levin #include <linux/list.h> 193fdf659dSSasha Levin #include <linux/types.h> 200528c2a7SPekka Enberg #include <pthread.h> 214155ba8cSPekka Enberg 224749e795SSasha Levin #define VIRTIO_BLK_MAX_DEV 4 2310eca11dSPekka Enberg 243d7831a1SAsias He /* 253d7831a1SAsias He * the header and status consume too entries 263d7831a1SAsias He */ 273d7831a1SAsias He #define DISK_SEG_MAX (VIRTIO_BLK_QUEUE_SIZE - 2) 28*f41a132bSSasha Levin #define VIRTIO_BLK_QUEUE_SIZE 128 29*f41a132bSSasha Levin #define NUM_VIRT_QUEUES 1 3010eca11dSPekka Enberg 318b52f877SSasha Levin struct blk_dev_req { 328b52f877SSasha Levin struct list_head list; 334749e795SSasha Levin struct virt_queue *vq; 34fe2a70d1SSasha Levin struct blk_dev *bdev; 3569971b13SSasha Levin struct iovec iov[VIRTIO_BLK_QUEUE_SIZE]; 3669971b13SSasha Levin u16 out, in, head; 378b52f877SSasha Levin struct kvm *kvm; 384749e795SSasha Levin }; 394749e795SSasha Levin 40fe2a70d1SSasha Levin struct blk_dev { 410528c2a7SPekka Enberg pthread_mutex_t mutex; 428b52f877SSasha Levin pthread_mutex_t req_mutex; 438b52f877SSasha Levin 44ebe9ac19SSasha Levin struct list_head list; 458b52f877SSasha Levin struct list_head req_list; 460528c2a7SPekka Enberg 47427948d5SSasha Levin struct virtio_pci vpci; 4840ce993fSPekka Enberg struct virtio_blk_config blk_config; 4938605e1cSSasha Levin struct disk_image *disk; 50427948d5SSasha Levin u32 features; 5110eca11dSPekka Enberg 5245e47970SAsias He struct virt_queue vqs[NUM_VIRT_QUEUES]; 538b52f877SSasha Levin struct blk_dev_req reqs[VIRTIO_BLK_QUEUE_SIZE]; 54fbc2fbf9SPekka Enberg }; 55fbc2fbf9SPekka Enberg 56ebe9ac19SSasha Levin static LIST_HEAD(bdevs); 57312c62d1SSasha Levin static int compat_id; 5840ce993fSPekka Enberg 598b52f877SSasha Levin static struct blk_dev_req *virtio_blk_req_pop(struct blk_dev *bdev) 604155ba8cSPekka Enberg { 618b52f877SSasha Levin struct blk_dev_req *req = NULL; 628b52f877SSasha Levin 638b52f877SSasha Levin mutex_lock(&bdev->req_mutex); 648b52f877SSasha Levin if (!list_empty(&bdev->req_list)) { 658b52f877SSasha Levin req = list_first_entry(&bdev->req_list, struct blk_dev_req, list); 668b52f877SSasha Levin list_del_init(&req->list); 678b52f877SSasha Levin } 688b52f877SSasha Levin mutex_unlock(&bdev->req_mutex); 698b52f877SSasha Levin 708b52f877SSasha Levin return req; 718b52f877SSasha Levin } 728b52f877SSasha Levin 738b52f877SSasha Levin static void virtio_blk_req_push(struct blk_dev *bdev, struct blk_dev_req *req) 748b52f877SSasha Levin { 758b52f877SSasha Levin mutex_lock(&bdev->req_mutex); 768b52f877SSasha Levin list_add(&req->list, &bdev->req_list); 778b52f877SSasha Levin mutex_unlock(&bdev->req_mutex); 788b52f877SSasha Levin } 798b52f877SSasha Levin 808b52f877SSasha Levin void virtio_blk_complete(void *param, long len) 818b52f877SSasha Levin { 828b52f877SSasha Levin struct blk_dev_req *req = param; 838b52f877SSasha Levin struct blk_dev *bdev = req->bdev; 848b52f877SSasha Levin int queueid = req->vq - bdev->vqs; 853fdf659dSSasha Levin u8 *status; 868b52f877SSasha Levin 878b52f877SSasha Levin /* status */ 888b52f877SSasha Levin status = req->iov[req->out + req->in - 1].iov_base; 898b52f877SSasha Levin *status = (len < 0) ? VIRTIO_BLK_S_IOERR : VIRTIO_BLK_S_OK; 908b52f877SSasha Levin 918b52f877SSasha Levin mutex_lock(&bdev->mutex); 928b52f877SSasha Levin virt_queue__set_used_elem(req->vq, req->head, len); 938b52f877SSasha Levin mutex_unlock(&bdev->mutex); 948b52f877SSasha Levin 958b52f877SSasha Levin virtio_pci__signal_vq(req->kvm, &bdev->vpci, queueid); 968b52f877SSasha Levin 978b52f877SSasha Levin virtio_blk_req_push(req->bdev, req); 988b52f877SSasha Levin } 998b52f877SSasha Levin 1008b52f877SSasha Levin static void virtio_blk_do_io_request(struct kvm *kvm, struct blk_dev_req *req) 1018b52f877SSasha Levin { 1028b52f877SSasha Levin struct virtio_blk_outhdr *req_hdr; 10369971b13SSasha Levin ssize_t block_cnt; 10469971b13SSasha Levin struct blk_dev *bdev; 10569971b13SSasha Levin struct iovec *iov; 106*f41a132bSSasha Levin u16 out, in; 1074155ba8cSPekka Enberg 10869971b13SSasha Levin block_cnt = -1; 1098b52f877SSasha Levin bdev = req->bdev; 1108b52f877SSasha Levin iov = req->iov; 1118b52f877SSasha Levin out = req->out; 1128b52f877SSasha Levin in = req->in; 1138b52f877SSasha Levin req_hdr = iov[0].iov_base; 11403110ff3SAsias He 1158b52f877SSasha Levin switch (req_hdr->type) { 11603110ff3SAsias He case VIRTIO_BLK_T_IN: 1178b52f877SSasha Levin block_cnt = disk_image__read(bdev->disk, req_hdr->sector, iov + 1, 118fb434ac3SSasha Levin in + out - 2, req); 119258dd093SPekka Enberg break; 12003110ff3SAsias He case VIRTIO_BLK_T_OUT: 1218b52f877SSasha Levin block_cnt = disk_image__write(bdev->disk, req_hdr->sector, iov + 1, 122fb434ac3SSasha Levin in + out - 2, req); 123258dd093SPekka Enberg break; 12429084a74SPrasad Joshi case VIRTIO_BLK_T_FLUSH: 12529084a74SPrasad Joshi block_cnt = disk_image__flush(bdev->disk); 126fb434ac3SSasha Levin virtio_blk_complete(req, block_cnt); 12729084a74SPrasad Joshi break; 128ff6462e8SSasha Levin case VIRTIO_BLK_T_GET_ID: 129ff6462e8SSasha Levin block_cnt = VIRTIO_BLK_ID_BYTES; 130ff6462e8SSasha Levin disk_image__get_serial(bdev->disk, (iov + 1)->iov_base, &block_cnt); 131fb434ac3SSasha Levin virtio_blk_complete(req, block_cnt); 132ff6462e8SSasha Levin break; 133258dd093SPekka Enberg default: 1348b52f877SSasha Levin pr_warning("request type %d", req_hdr->type); 13570b53f25SSasha Levin block_cnt = -1; 136407475bfSPekka Enberg break; 13703110ff3SAsias He } 1384155ba8cSPekka Enberg } 1394155ba8cSPekka Enberg 14069971b13SSasha Levin static void virtio_blk_do_io(struct kvm *kvm, struct virt_queue *vq, struct blk_dev *bdev) 14145e47970SAsias He { 14269971b13SSasha Levin while (virt_queue__available(vq)) { 1438b52f877SSasha Levin struct blk_dev_req *req = virtio_blk_req_pop(bdev); 144407475bfSPekka Enberg 1458b52f877SSasha Levin *req = (struct blk_dev_req) { 14669971b13SSasha Levin .vq = vq, 14769971b13SSasha Levin .bdev = bdev, 1488b52f877SSasha Levin .kvm = kvm, 14969971b13SSasha Levin }; 1508b52f877SSasha Levin req->head = virt_queue__get_iov(vq, req->iov, &req->out, &req->in, kvm); 15145e47970SAsias He 1528b52f877SSasha Levin virtio_blk_do_io_request(kvm, req); 15369971b13SSasha Levin } 1544baf6f73SSasha Levin } 1550528c2a7SPekka Enberg 156427948d5SSasha Levin static void set_config(struct kvm *kvm, void *dev, u8 data, u32 offset) 157427948d5SSasha Levin { 158427948d5SSasha Levin struct blk_dev *bdev = dev; 159427948d5SSasha Levin 160427948d5SSasha Levin ((u8 *)(&bdev->blk_config))[offset] = data; 161427948d5SSasha Levin } 162427948d5SSasha Levin 163427948d5SSasha Levin static u8 get_config(struct kvm *kvm, void *dev, u32 offset) 164427948d5SSasha Levin { 165427948d5SSasha Levin struct blk_dev *bdev = dev; 166427948d5SSasha Levin 167427948d5SSasha Levin return ((u8 *)(&bdev->blk_config))[offset]; 168427948d5SSasha Levin } 169427948d5SSasha Levin 170427948d5SSasha Levin static u32 get_host_features(struct kvm *kvm, void *dev) 171427948d5SSasha Levin { 172427948d5SSasha Levin return 1UL << VIRTIO_BLK_F_SEG_MAX | 1UL << VIRTIO_BLK_F_FLUSH; 173427948d5SSasha Levin } 174427948d5SSasha Levin 175427948d5SSasha Levin static void set_guest_features(struct kvm *kvm, void *dev, u32 features) 176427948d5SSasha Levin { 177427948d5SSasha Levin struct blk_dev *bdev = dev; 178427948d5SSasha Levin 179427948d5SSasha Levin bdev->features = features; 180427948d5SSasha Levin } 181427948d5SSasha Levin 182427948d5SSasha Levin static int init_vq(struct kvm *kvm, void *dev, u32 vq, u32 pfn) 183427948d5SSasha Levin { 184427948d5SSasha Levin struct blk_dev *bdev = dev; 185427948d5SSasha Levin struct virt_queue *queue; 186427948d5SSasha Levin void *p; 187427948d5SSasha Levin 188312c62d1SSasha Levin compat__remove_message(compat_id); 189427948d5SSasha Levin 190427948d5SSasha Levin queue = &bdev->vqs[vq]; 191427948d5SSasha Levin queue->pfn = pfn; 192427948d5SSasha Levin p = guest_pfn_to_host(kvm, queue->pfn); 193427948d5SSasha Levin 194427948d5SSasha Levin vring_init(&queue->vring, VIRTIO_BLK_QUEUE_SIZE, p, VIRTIO_PCI_VRING_ALIGN); 195427948d5SSasha Levin 196427948d5SSasha Levin return 0; 197427948d5SSasha Levin } 198427948d5SSasha Levin 199427948d5SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq) 200427948d5SSasha Levin { 201427948d5SSasha Levin struct blk_dev *bdev = dev; 202427948d5SSasha Levin 203427948d5SSasha Levin virtio_blk_do_io(kvm, &bdev->vqs[vq], bdev); 204427948d5SSasha Levin 205427948d5SSasha Levin return 0; 206427948d5SSasha Levin } 207427948d5SSasha Levin 208427948d5SSasha Levin static int get_pfn_vq(struct kvm *kvm, void *dev, u32 vq) 209427948d5SSasha Levin { 210427948d5SSasha Levin struct blk_dev *bdev = dev; 211427948d5SSasha Levin 212427948d5SSasha Levin return bdev->vqs[vq].pfn; 213427948d5SSasha Levin } 214427948d5SSasha Levin 215427948d5SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq) 216427948d5SSasha Levin { 217427948d5SSasha Levin return VIRTIO_BLK_QUEUE_SIZE; 218427948d5SSasha Levin } 219427948d5SSasha Levin 22043835ac9SSasha Levin void virtio_blk__init(struct kvm *kvm, struct disk_image *disk) 2214749e795SSasha Levin { 222fe2a70d1SSasha Levin struct blk_dev *bdev; 2238b52f877SSasha Levin size_t i; 2244749e795SSasha Levin 2254749e795SSasha Levin if (!disk) 2264749e795SSasha Levin return; 2274749e795SSasha Levin 228ebe9ac19SSasha Levin bdev = calloc(1, sizeof(struct blk_dev)); 229ebe9ac19SSasha Levin if (bdev == NULL) 230fe2a70d1SSasha Levin die("Failed allocating bdev"); 2314749e795SSasha Levin 232fe2a70d1SSasha Levin *bdev = (struct blk_dev) { 2334749e795SSasha Levin .mutex = PTHREAD_MUTEX_INITIALIZER, 2348b52f877SSasha Levin .req_mutex = PTHREAD_MUTEX_INITIALIZER, 2354749e795SSasha Levin .disk = disk, 2364749e795SSasha Levin .blk_config = (struct virtio_blk_config) { 2374749e795SSasha Levin .capacity = disk->size / SECTOR_SIZE, 2383d7831a1SAsias He .seg_max = DISK_SEG_MAX, 2394749e795SSasha Levin }, 240427948d5SSasha Levin }; 241427948d5SSasha Levin 242507e02d8SAsias He virtio_pci__init(kvm, &bdev->vpci, bdev, PCI_DEVICE_ID_VIRTIO_BLK, VIRTIO_ID_BLOCK, PCI_CLASS_BLK); 243427948d5SSasha Levin bdev->vpci.ops = (struct virtio_pci_ops) { 244427948d5SSasha Levin .set_config = set_config, 245427948d5SSasha Levin .get_config = get_config, 246427948d5SSasha Levin .get_host_features = get_host_features, 247427948d5SSasha Levin .set_guest_features = set_guest_features, 248427948d5SSasha Levin .init_vq = init_vq, 249427948d5SSasha Levin .notify_vq = notify_vq, 250427948d5SSasha Levin .get_pfn_vq = get_pfn_vq, 251427948d5SSasha Levin .get_size_vq = get_size_vq, 252b30d05adSPekka Enberg }; 253b30d05adSPekka Enberg 254ebe9ac19SSasha Levin list_add_tail(&bdev->list, &bdevs); 255ebe9ac19SSasha Levin 2568b52f877SSasha Levin INIT_LIST_HEAD(&bdev->req_list); 2578b52f877SSasha Levin for (i = 0; i < ARRAY_SIZE(bdev->reqs); i++) 2588b52f877SSasha Levin list_add(&bdev->reqs[i].list, &bdev->req_list); 2598b52f877SSasha Levin 260fb434ac3SSasha Levin disk_image__set_callback(bdev->disk, virtio_blk_complete); 261fb434ac3SSasha Levin 262312c62d1SSasha Levin if (compat_id != -1) 263312c62d1SSasha Levin compat_id = compat__add_message("virtio-blk device was not detected", 264404d164bSSasha Levin "While you have requested a virtio-blk device, " 265fc835ab3SSasha Levin "the guest kernel did not initialize it.\n" 266fc835ab3SSasha Levin "Please make sure that the guest kernel was " 267fc835ab3SSasha Levin "compiled with CONFIG_VIRTIO_BLK=y enabled " 268fc835ab3SSasha Levin "in its .config"); 269b30d05adSPekka Enberg } 270bcb6aacaSPrasad Joshi 271bcb6aacaSPrasad Joshi void virtio_blk__init_all(struct kvm *kvm) 272bcb6aacaSPrasad Joshi { 273bcb6aacaSPrasad Joshi int i; 274bcb6aacaSPrasad Joshi 275bcb6aacaSPrasad Joshi for (i = 0; i < kvm->nr_disks; i++) 276bcb6aacaSPrasad Joshi virtio_blk__init(kvm, kvm->disks[i]); 277bcb6aacaSPrasad Joshi } 278a0a1e3c2SPrasad Joshi 279a0a1e3c2SPrasad Joshi void virtio_blk__delete_all(struct kvm *kvm) 280a0a1e3c2SPrasad Joshi { 281ebe9ac19SSasha Levin while (!list_empty(&bdevs)) { 282ebe9ac19SSasha Levin struct blk_dev *bdev; 283a0a1e3c2SPrasad Joshi 284ebe9ac19SSasha Levin bdev = list_first_entry(&bdevs, struct blk_dev, list); 285ebe9ac19SSasha Levin list_del(&bdev->list); 286ebe9ac19SSasha Levin free(bdev); 287ebe9ac19SSasha Levin } 288a0a1e3c2SPrasad Joshi } 289