1416b2c2dSAsias He #include "kvm/virtio-blk.h" 2b30d05adSPekka Enberg 331638bcaSCyrill Gorcunov #include "kvm/virtio-pci-dev.h" 45a24a9f2SPekka Enberg #include "kvm/disk-image.h" 539d6af07SAsias He #include "kvm/virtio.h" 64ef0f4d6SPekka Enberg #include "kvm/mutex.h" 7fe99fd4eSPekka Enberg #include "kvm/util.h" 88b1ff07eSPekka Enberg #include "kvm/kvm.h" 9b30d05adSPekka Enberg #include "kvm/pci.h" 10fb0957f2SSasha Levin #include "kvm/threadpool.h" 11ec75b82fSSasha Levin #include "kvm/ioeventfd.h" 12404d164bSSasha Levin #include "kvm/guest_compat.h" 13427948d5SSasha Levin #include "kvm/virtio-pci.h" 14b30d05adSPekka Enberg 1520c64ecaSPekka Enberg #include <linux/virtio_ring.h> 1620c64ecaSPekka Enberg #include <linux/virtio_blk.h> 170528c2a7SPekka Enberg 18427948d5SSasha Levin #include <linux/kernel.h> 19ebe9ac19SSasha Levin #include <linux/list.h> 203fdf659dSSasha Levin #include <linux/types.h> 210528c2a7SPekka Enberg #include <pthread.h> 224155ba8cSPekka Enberg 234749e795SSasha Levin #define VIRTIO_BLK_MAX_DEV 4 2410eca11dSPekka Enberg #define NUM_VIRT_QUEUES 1 2510eca11dSPekka Enberg 2603110ff3SAsias He #define VIRTIO_BLK_QUEUE_SIZE 128 273d7831a1SAsias He /* 283d7831a1SAsias He * the header and status consume too entries 293d7831a1SAsias He */ 303d7831a1SAsias He #define DISK_SEG_MAX (VIRTIO_BLK_QUEUE_SIZE - 2) 3110eca11dSPekka Enberg 328b52f877SSasha Levin struct blk_dev_req { 338b52f877SSasha Levin struct list_head list; 344749e795SSasha Levin struct virt_queue *vq; 35fe2a70d1SSasha Levin struct blk_dev *bdev; 3669971b13SSasha Levin struct iovec iov[VIRTIO_BLK_QUEUE_SIZE]; 3769971b13SSasha Levin u16 out, in, head; 388b52f877SSasha Levin struct kvm *kvm; 394749e795SSasha Levin }; 404749e795SSasha Levin 41fe2a70d1SSasha Levin struct blk_dev { 420528c2a7SPekka Enberg pthread_mutex_t mutex; 438b52f877SSasha Levin pthread_mutex_t req_mutex; 448b52f877SSasha Levin 45ebe9ac19SSasha Levin struct list_head list; 468b52f877SSasha Levin struct list_head req_list; 470528c2a7SPekka Enberg 48427948d5SSasha Levin struct virtio_pci vpci; 4940ce993fSPekka Enberg struct virtio_blk_config blk_config; 5038605e1cSSasha Levin struct disk_image *disk; 51427948d5SSasha Levin u32 features; 5210eca11dSPekka Enberg 5345e47970SAsias He struct virt_queue vqs[NUM_VIRT_QUEUES]; 548b52f877SSasha Levin struct blk_dev_req reqs[VIRTIO_BLK_QUEUE_SIZE]; 55fbc2fbf9SPekka Enberg }; 56fbc2fbf9SPekka Enberg 57ebe9ac19SSasha Levin static LIST_HEAD(bdevs); 58312c62d1SSasha Levin static int compat_id; 5940ce993fSPekka Enberg 608b52f877SSasha Levin static struct blk_dev_req *virtio_blk_req_pop(struct blk_dev *bdev) 614155ba8cSPekka Enberg { 628b52f877SSasha Levin struct blk_dev_req *req = NULL; 638b52f877SSasha Levin 648b52f877SSasha Levin mutex_lock(&bdev->req_mutex); 658b52f877SSasha Levin if (!list_empty(&bdev->req_list)) { 668b52f877SSasha Levin req = list_first_entry(&bdev->req_list, struct blk_dev_req, list); 678b52f877SSasha Levin list_del_init(&req->list); 688b52f877SSasha Levin } 698b52f877SSasha Levin mutex_unlock(&bdev->req_mutex); 708b52f877SSasha Levin 718b52f877SSasha Levin return req; 728b52f877SSasha Levin } 738b52f877SSasha Levin 748b52f877SSasha Levin static void virtio_blk_req_push(struct blk_dev *bdev, struct blk_dev_req *req) 758b52f877SSasha Levin { 768b52f877SSasha Levin mutex_lock(&bdev->req_mutex); 778b52f877SSasha Levin list_add(&req->list, &bdev->req_list); 788b52f877SSasha Levin mutex_unlock(&bdev->req_mutex); 798b52f877SSasha Levin } 808b52f877SSasha Levin 818b52f877SSasha Levin void virtio_blk_complete(void *param, long len) 828b52f877SSasha Levin { 838b52f877SSasha Levin struct blk_dev_req *req = param; 848b52f877SSasha Levin struct blk_dev *bdev = req->bdev; 858b52f877SSasha Levin int queueid = req->vq - bdev->vqs; 863fdf659dSSasha Levin u8 *status; 878b52f877SSasha Levin 888b52f877SSasha Levin /* status */ 898b52f877SSasha Levin status = req->iov[req->out + req->in - 1].iov_base; 908b52f877SSasha Levin *status = (len < 0) ? VIRTIO_BLK_S_IOERR : VIRTIO_BLK_S_OK; 918b52f877SSasha Levin 928b52f877SSasha Levin mutex_lock(&bdev->mutex); 938b52f877SSasha Levin virt_queue__set_used_elem(req->vq, req->head, len); 948b52f877SSasha Levin mutex_unlock(&bdev->mutex); 958b52f877SSasha Levin 968b52f877SSasha Levin virtio_pci__signal_vq(req->kvm, &bdev->vpci, queueid); 978b52f877SSasha Levin 988b52f877SSasha Levin virtio_blk_req_push(req->bdev, req); 998b52f877SSasha Levin } 1008b52f877SSasha Levin 1018b52f877SSasha Levin static void virtio_blk_do_io_request(struct kvm *kvm, struct blk_dev_req *req) 1028b52f877SSasha Levin { 1038b52f877SSasha Levin struct virtio_blk_outhdr *req_hdr; 10469971b13SSasha Levin ssize_t block_cnt; 10569971b13SSasha Levin struct blk_dev *bdev; 10669971b13SSasha Levin struct virt_queue *queue; 10769971b13SSasha Levin struct iovec *iov; 10869971b13SSasha Levin u16 out, in, head; 1094155ba8cSPekka Enberg 11069971b13SSasha Levin block_cnt = -1; 1118b52f877SSasha Levin bdev = req->bdev; 1128b52f877SSasha Levin queue = req->vq; 1138b52f877SSasha Levin iov = req->iov; 1148b52f877SSasha Levin out = req->out; 1158b52f877SSasha Levin in = req->in; 1168b52f877SSasha Levin head = req->head; 1178b52f877SSasha Levin req_hdr = iov[0].iov_base; 11803110ff3SAsias He 1198b52f877SSasha Levin switch (req_hdr->type) { 12003110ff3SAsias He case VIRTIO_BLK_T_IN: 1218b52f877SSasha Levin block_cnt = disk_image__read(bdev->disk, req_hdr->sector, iov + 1, 122*fb434ac3SSasha Levin in + out - 2, req); 123258dd093SPekka Enberg break; 12403110ff3SAsias He case VIRTIO_BLK_T_OUT: 1258b52f877SSasha Levin block_cnt = disk_image__write(bdev->disk, req_hdr->sector, iov + 1, 126*fb434ac3SSasha Levin in + out - 2, req); 127258dd093SPekka Enberg break; 12829084a74SPrasad Joshi case VIRTIO_BLK_T_FLUSH: 12929084a74SPrasad Joshi block_cnt = disk_image__flush(bdev->disk); 130*fb434ac3SSasha Levin virtio_blk_complete(req, block_cnt); 13129084a74SPrasad Joshi break; 132ff6462e8SSasha Levin case VIRTIO_BLK_T_GET_ID: 133ff6462e8SSasha Levin block_cnt = VIRTIO_BLK_ID_BYTES; 134ff6462e8SSasha Levin disk_image__get_serial(bdev->disk, (iov + 1)->iov_base, &block_cnt); 135*fb434ac3SSasha Levin virtio_blk_complete(req, block_cnt); 136ff6462e8SSasha Levin break; 137258dd093SPekka Enberg default: 1388b52f877SSasha Levin pr_warning("request type %d", req_hdr->type); 13970b53f25SSasha Levin block_cnt = -1; 140407475bfSPekka Enberg break; 14103110ff3SAsias He } 1424155ba8cSPekka Enberg } 1434155ba8cSPekka Enberg 14469971b13SSasha Levin static void virtio_blk_do_io(struct kvm *kvm, struct virt_queue *vq, struct blk_dev *bdev) 14545e47970SAsias He { 14669971b13SSasha Levin while (virt_queue__available(vq)) { 1478b52f877SSasha Levin struct blk_dev_req *req = virtio_blk_req_pop(bdev); 148407475bfSPekka Enberg 1498b52f877SSasha Levin *req = (struct blk_dev_req) { 15069971b13SSasha Levin .vq = vq, 15169971b13SSasha Levin .bdev = bdev, 1528b52f877SSasha Levin .kvm = kvm, 15369971b13SSasha Levin }; 1548b52f877SSasha Levin req->head = virt_queue__get_iov(vq, req->iov, &req->out, &req->in, kvm); 15545e47970SAsias He 1568b52f877SSasha Levin virtio_blk_do_io_request(kvm, req); 15769971b13SSasha Levin } 1584baf6f73SSasha Levin } 1590528c2a7SPekka Enberg 160427948d5SSasha Levin static void set_config(struct kvm *kvm, void *dev, u8 data, u32 offset) 161427948d5SSasha Levin { 162427948d5SSasha Levin struct blk_dev *bdev = dev; 163427948d5SSasha Levin 164427948d5SSasha Levin ((u8 *)(&bdev->blk_config))[offset] = data; 165427948d5SSasha Levin } 166427948d5SSasha Levin 167427948d5SSasha Levin static u8 get_config(struct kvm *kvm, void *dev, u32 offset) 168427948d5SSasha Levin { 169427948d5SSasha Levin struct blk_dev *bdev = dev; 170427948d5SSasha Levin 171427948d5SSasha Levin return ((u8 *)(&bdev->blk_config))[offset]; 172427948d5SSasha Levin } 173427948d5SSasha Levin 174427948d5SSasha Levin static u32 get_host_features(struct kvm *kvm, void *dev) 175427948d5SSasha Levin { 176427948d5SSasha Levin return 1UL << VIRTIO_BLK_F_SEG_MAX | 1UL << VIRTIO_BLK_F_FLUSH; 177427948d5SSasha Levin } 178427948d5SSasha Levin 179427948d5SSasha Levin static void set_guest_features(struct kvm *kvm, void *dev, u32 features) 180427948d5SSasha Levin { 181427948d5SSasha Levin struct blk_dev *bdev = dev; 182427948d5SSasha Levin 183427948d5SSasha Levin bdev->features = features; 184427948d5SSasha Levin } 185427948d5SSasha Levin 186427948d5SSasha Levin static int init_vq(struct kvm *kvm, void *dev, u32 vq, u32 pfn) 187427948d5SSasha Levin { 188427948d5SSasha Levin struct blk_dev *bdev = dev; 189427948d5SSasha Levin struct virt_queue *queue; 190427948d5SSasha Levin void *p; 191427948d5SSasha Levin 192312c62d1SSasha Levin compat__remove_message(compat_id); 193427948d5SSasha Levin 194427948d5SSasha Levin queue = &bdev->vqs[vq]; 195427948d5SSasha Levin queue->pfn = pfn; 196427948d5SSasha Levin p = guest_pfn_to_host(kvm, queue->pfn); 197427948d5SSasha Levin 198427948d5SSasha Levin vring_init(&queue->vring, VIRTIO_BLK_QUEUE_SIZE, p, VIRTIO_PCI_VRING_ALIGN); 199427948d5SSasha Levin 200427948d5SSasha Levin return 0; 201427948d5SSasha Levin } 202427948d5SSasha Levin 203427948d5SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq) 204427948d5SSasha Levin { 205427948d5SSasha Levin struct blk_dev *bdev = dev; 206427948d5SSasha Levin 207427948d5SSasha Levin virtio_blk_do_io(kvm, &bdev->vqs[vq], bdev); 208427948d5SSasha Levin 209427948d5SSasha Levin return 0; 210427948d5SSasha Levin } 211427948d5SSasha Levin 212427948d5SSasha Levin static int get_pfn_vq(struct kvm *kvm, void *dev, u32 vq) 213427948d5SSasha Levin { 214427948d5SSasha Levin struct blk_dev *bdev = dev; 215427948d5SSasha Levin 216427948d5SSasha Levin return bdev->vqs[vq].pfn; 217427948d5SSasha Levin } 218427948d5SSasha Levin 219427948d5SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq) 220427948d5SSasha Levin { 221427948d5SSasha Levin return VIRTIO_BLK_QUEUE_SIZE; 222427948d5SSasha Levin } 223427948d5SSasha Levin 22443835ac9SSasha Levin void virtio_blk__init(struct kvm *kvm, struct disk_image *disk) 2254749e795SSasha Levin { 226fe2a70d1SSasha Levin struct blk_dev *bdev; 2278b52f877SSasha Levin size_t i; 2284749e795SSasha Levin 2294749e795SSasha Levin if (!disk) 2304749e795SSasha Levin return; 2314749e795SSasha Levin 232ebe9ac19SSasha Levin bdev = calloc(1, sizeof(struct blk_dev)); 233ebe9ac19SSasha Levin if (bdev == NULL) 234fe2a70d1SSasha Levin die("Failed allocating bdev"); 2354749e795SSasha Levin 236fe2a70d1SSasha Levin *bdev = (struct blk_dev) { 2374749e795SSasha Levin .mutex = PTHREAD_MUTEX_INITIALIZER, 2388b52f877SSasha Levin .req_mutex = PTHREAD_MUTEX_INITIALIZER, 2394749e795SSasha Levin .disk = disk, 2404749e795SSasha Levin .blk_config = (struct virtio_blk_config) { 2414749e795SSasha Levin .capacity = disk->size / SECTOR_SIZE, 2423d7831a1SAsias He .seg_max = DISK_SEG_MAX, 2434749e795SSasha Levin }, 244427948d5SSasha Levin }; 245427948d5SSasha Levin 246507e02d8SAsias He virtio_pci__init(kvm, &bdev->vpci, bdev, PCI_DEVICE_ID_VIRTIO_BLK, VIRTIO_ID_BLOCK, PCI_CLASS_BLK); 247427948d5SSasha Levin bdev->vpci.ops = (struct virtio_pci_ops) { 248427948d5SSasha Levin .set_config = set_config, 249427948d5SSasha Levin .get_config = get_config, 250427948d5SSasha Levin .get_host_features = get_host_features, 251427948d5SSasha Levin .set_guest_features = set_guest_features, 252427948d5SSasha Levin .init_vq = init_vq, 253427948d5SSasha Levin .notify_vq = notify_vq, 254427948d5SSasha Levin .get_pfn_vq = get_pfn_vq, 255427948d5SSasha Levin .get_size_vq = get_size_vq, 256b30d05adSPekka Enberg }; 257b30d05adSPekka Enberg 258ebe9ac19SSasha Levin list_add_tail(&bdev->list, &bdevs); 259ebe9ac19SSasha Levin 2608b52f877SSasha Levin INIT_LIST_HEAD(&bdev->req_list); 2618b52f877SSasha Levin for (i = 0; i < ARRAY_SIZE(bdev->reqs); i++) 2628b52f877SSasha Levin list_add(&bdev->reqs[i].list, &bdev->req_list); 2638b52f877SSasha Levin 264*fb434ac3SSasha Levin disk_image__set_callback(bdev->disk, virtio_blk_complete); 265*fb434ac3SSasha Levin 266312c62d1SSasha Levin if (compat_id != -1) 267312c62d1SSasha Levin compat_id = compat__add_message("virtio-blk device was not detected", 268404d164bSSasha Levin "While you have requested a virtio-blk device, " 269fc835ab3SSasha Levin "the guest kernel did not initialize it.\n" 270fc835ab3SSasha Levin "Please make sure that the guest kernel was " 271fc835ab3SSasha Levin "compiled with CONFIG_VIRTIO_BLK=y enabled " 272fc835ab3SSasha Levin "in its .config"); 273b30d05adSPekka Enberg } 274bcb6aacaSPrasad Joshi 275bcb6aacaSPrasad Joshi void virtio_blk__init_all(struct kvm *kvm) 276bcb6aacaSPrasad Joshi { 277bcb6aacaSPrasad Joshi int i; 278bcb6aacaSPrasad Joshi 279bcb6aacaSPrasad Joshi for (i = 0; i < kvm->nr_disks; i++) 280bcb6aacaSPrasad Joshi virtio_blk__init(kvm, kvm->disks[i]); 281bcb6aacaSPrasad Joshi } 282a0a1e3c2SPrasad Joshi 283a0a1e3c2SPrasad Joshi void virtio_blk__delete_all(struct kvm *kvm) 284a0a1e3c2SPrasad Joshi { 285ebe9ac19SSasha Levin while (!list_empty(&bdevs)) { 286ebe9ac19SSasha Levin struct blk_dev *bdev; 287a0a1e3c2SPrasad Joshi 288ebe9ac19SSasha Levin bdev = list_first_entry(&bdevs, struct blk_dev, list); 289ebe9ac19SSasha Levin list_del(&bdev->list); 290ebe9ac19SSasha Levin free(bdev); 291ebe9ac19SSasha Levin } 292a0a1e3c2SPrasad Joshi } 293