xref: /kvmtool/virtio/blk.c (revision 95242e44535bfb37b4ac4c90c353d5b73824a08e)
#include "kvm/virtio-blk.h"

#include "kvm/virtio-pci-dev.h"
#include "kvm/disk-image.h"
#include "kvm/mutex.h"
#include "kvm/util.h"
#include "kvm/kvm.h"
#include "kvm/pci.h"
#include "kvm/threadpool.h"
#include "kvm/ioeventfd.h"
#include "kvm/guest_compat.h"
#include "kvm/virtio-pci.h"
#include "kvm/virtio.h"

#include <linux/virtio_ring.h>
#include <linux/virtio_blk.h>
#include <linux/kernel.h>
#include <linux/list.h>
#include <linux/types.h>
#include <errno.h>
#include <pthread.h>
#include <unistd.h>
214155ba8cSPekka Enberg 
#define VIRTIO_BLK_MAX_DEV		4

/* Number of descriptors in the single request queue. */
#define VIRTIO_BLK_QUEUE_SIZE		256
#define NUM_VIRT_QUEUES			1

/*
 * The request header and the status byte consume two entries of the
 * queue, so that many fewer segments are left for data.
 */
#define DISK_SEG_MAX			(VIRTIO_BLK_QUEUE_SIZE - 2)
3010eca11dSPekka Enberg 
318b52f877SSasha Levin struct blk_dev_req {
324749e795SSasha Levin 	struct virt_queue		*vq;
33fe2a70d1SSasha Levin 	struct blk_dev			*bdev;
3469971b13SSasha Levin 	struct iovec			iov[VIRTIO_BLK_QUEUE_SIZE];
3569971b13SSasha Levin 	u16				out, in, head;
368b52f877SSasha Levin 	struct kvm			*kvm;
374749e795SSasha Levin };
384749e795SSasha Levin 
39fe2a70d1SSasha Levin struct blk_dev {
40d3476f7dSSasha Levin 	struct mutex			mutex;
418b52f877SSasha Levin 
42ebe9ac19SSasha Levin 	struct list_head		list;
430528c2a7SPekka Enberg 
4402eca50cSAsias He 	struct virtio_device		vdev;
4540ce993fSPekka Enberg 	struct virtio_blk_config	blk_config;
4638605e1cSSasha Levin 	struct disk_image		*disk;
47427948d5SSasha Levin 	u32				features;
4810eca11dSPekka Enberg 
4945e47970SAsias He 	struct virt_queue		vqs[NUM_VIRT_QUEUES];
508b52f877SSasha Levin 	struct blk_dev_req		reqs[VIRTIO_BLK_QUEUE_SIZE];
515ac1178bSAsias He 
525ac1178bSAsias He 	pthread_t			io_thread;
535ac1178bSAsias He 	int				io_efd;
545ac1178bSAsias He 
555ac1178bSAsias He 	struct kvm			*kvm;
56fbc2fbf9SPekka Enberg };
57fbc2fbf9SPekka Enberg 
/*
 * Compat message id: -1 until virtio_blk__init_one() registers the message,
 * passed to compat__remove_message() from init_vq().
 */
static int compat_id = -1;
/* Every blk_dev created by virtio_blk__init_one(). */
static LIST_HEAD(bdevs);
6040ce993fSPekka Enberg 
618b52f877SSasha Levin void virtio_blk_complete(void *param, long len)
628b52f877SSasha Levin {
638b52f877SSasha Levin 	struct blk_dev_req *req = param;
648b52f877SSasha Levin 	struct blk_dev *bdev = req->bdev;
658b52f877SSasha Levin 	int queueid = req->vq - bdev->vqs;
663fdf659dSSasha Levin 	u8 *status;
678b52f877SSasha Levin 
688b52f877SSasha Levin 	/* status */
698b52f877SSasha Levin 	status	= req->iov[req->out + req->in - 1].iov_base;
708b52f877SSasha Levin 	*status	= (len < 0) ? VIRTIO_BLK_S_IOERR : VIRTIO_BLK_S_OK;
718b52f877SSasha Levin 
728b52f877SSasha Levin 	mutex_lock(&bdev->mutex);
738b52f877SSasha Levin 	virt_queue__set_used_elem(req->vq, req->head, len);
748b52f877SSasha Levin 	mutex_unlock(&bdev->mutex);
758b52f877SSasha Levin 
767ab3d207SSasha Levin 	if (virtio_queue__should_signal(&bdev->vqs[queueid]))
7702eca50cSAsias He 		bdev->vdev.ops->signal_vq(req->kvm, &bdev->vdev, queueid);
788b52f877SSasha Levin }
798b52f877SSasha Levin 
8001dafc9eSMarc Zyngier static void virtio_blk_do_io_request(struct kvm *kvm, struct virt_queue *vq, struct blk_dev_req *req)
818b52f877SSasha Levin {
828b52f877SSasha Levin 	struct virtio_blk_outhdr *req_hdr;
8369971b13SSasha Levin 	ssize_t block_cnt;
8469971b13SSasha Levin 	struct blk_dev *bdev;
8569971b13SSasha Levin 	struct iovec *iov;
86f41a132bSSasha Levin 	u16 out, in;
8701dafc9eSMarc Zyngier 	u32 type;
8801dafc9eSMarc Zyngier 	u64 sector;
894155ba8cSPekka Enberg 
9069971b13SSasha Levin 	block_cnt	= -1;
918b52f877SSasha Levin 	bdev		= req->bdev;
928b52f877SSasha Levin 	iov		= req->iov;
938b52f877SSasha Levin 	out		= req->out;
948b52f877SSasha Levin 	in		= req->in;
958b52f877SSasha Levin 	req_hdr		= iov[0].iov_base;
9603110ff3SAsias He 
9701dafc9eSMarc Zyngier 	type = virtio_guest_to_host_u32(vq, req_hdr->type);
9801dafc9eSMarc Zyngier 	sector = virtio_guest_to_host_u64(vq, req_hdr->sector);
9901dafc9eSMarc Zyngier 
10001dafc9eSMarc Zyngier 	switch (type) {
10103110ff3SAsias He 	case VIRTIO_BLK_T_IN:
10201dafc9eSMarc Zyngier 		block_cnt = disk_image__read(bdev->disk, sector,
10334239c78SAsias He 				iov + 1, in + out - 2, req);
104258dd093SPekka Enberg 		break;
10503110ff3SAsias He 	case VIRTIO_BLK_T_OUT:
10601dafc9eSMarc Zyngier 		block_cnt = disk_image__write(bdev->disk, sector,
10734239c78SAsias He 				iov + 1, in + out - 2, req);
108258dd093SPekka Enberg 		break;
10929084a74SPrasad Joshi 	case VIRTIO_BLK_T_FLUSH:
11029084a74SPrasad Joshi 		block_cnt = disk_image__flush(bdev->disk);
111fb434ac3SSasha Levin 		virtio_blk_complete(req, block_cnt);
11229084a74SPrasad Joshi 		break;
113ff6462e8SSasha Levin 	case VIRTIO_BLK_T_GET_ID:
114ff6462e8SSasha Levin 		block_cnt = VIRTIO_BLK_ID_BYTES;
11534239c78SAsias He 		disk_image__get_serial(bdev->disk,
11634239c78SAsias He 				(iov + 1)->iov_base, &block_cnt);
117fb434ac3SSasha Levin 		virtio_blk_complete(req, block_cnt);
118ff6462e8SSasha Levin 		break;
119258dd093SPekka Enberg 	default:
12001dafc9eSMarc Zyngier 		pr_warning("request type %d", type);
12170b53f25SSasha Levin 		block_cnt	= -1;
122407475bfSPekka Enberg 		break;
12303110ff3SAsias He 	}
1244155ba8cSPekka Enberg }
1254155ba8cSPekka Enberg 
12669971b13SSasha Levin static void virtio_blk_do_io(struct kvm *kvm, struct virt_queue *vq, struct blk_dev *bdev)
12745e47970SAsias He {
1282fddfdb5SAsias He 	struct blk_dev_req *req;
1292fddfdb5SAsias He 	u16 head;
130407475bfSPekka Enberg 
1312fddfdb5SAsias He 	while (virt_queue__available(vq)) {
1322fddfdb5SAsias He 		head		= virt_queue__pop(vq);
1332fddfdb5SAsias He 		req		= &bdev->reqs[head];
13434239c78SAsias He 		req->head	= virt_queue__get_head_iov(vq, req->iov, &req->out,
13534239c78SAsias He 					&req->in, head, kvm);
1362fddfdb5SAsias He 		req->vq		= vq;
13745e47970SAsias He 
13801dafc9eSMarc Zyngier 		virtio_blk_do_io_request(kvm, vq, req);
13969971b13SSasha Levin 	}
1404baf6f73SSasha Levin }
1410528c2a7SPekka Enberg 
142c5ae742bSSasha Levin static u8 *get_config(struct kvm *kvm, void *dev)
143427948d5SSasha Levin {
144427948d5SSasha Levin 	struct blk_dev *bdev = dev;
145427948d5SSasha Levin 
146c5ae742bSSasha Levin 	return ((u8 *)(&bdev->blk_config));
147427948d5SSasha Levin }
148427948d5SSasha Levin 
149427948d5SSasha Levin static u32 get_host_features(struct kvm *kvm, void *dev)
150427948d5SSasha Levin {
1517ab3d207SSasha Levin 	return	1UL << VIRTIO_BLK_F_SEG_MAX
1527ab3d207SSasha Levin 		| 1UL << VIRTIO_BLK_F_FLUSH
153754c8ce3SSasha Levin 		| 1UL << VIRTIO_RING_F_EVENT_IDX
154754c8ce3SSasha Levin 		| 1UL << VIRTIO_RING_F_INDIRECT_DESC;
155427948d5SSasha Levin }
156427948d5SSasha Levin 
157427948d5SSasha Levin static void set_guest_features(struct kvm *kvm, void *dev, u32 features)
158427948d5SSasha Levin {
159427948d5SSasha Levin 	struct blk_dev *bdev = dev;
16001dafc9eSMarc Zyngier 	struct virtio_blk_config *conf = &bdev->blk_config;
16101dafc9eSMarc Zyngier 	struct virtio_blk_geometry *geo = &conf->geometry;
162427948d5SSasha Levin 
163427948d5SSasha Levin 	bdev->features = features;
16401dafc9eSMarc Zyngier 
16501dafc9eSMarc Zyngier 	conf->capacity = virtio_host_to_guest_u64(&bdev->vdev, conf->capacity);
16601dafc9eSMarc Zyngier 	conf->size_max = virtio_host_to_guest_u32(&bdev->vdev, conf->size_max);
16701dafc9eSMarc Zyngier 	conf->seg_max = virtio_host_to_guest_u32(&bdev->vdev, conf->seg_max);
16801dafc9eSMarc Zyngier 
16901dafc9eSMarc Zyngier 	/* Geometry */
17001dafc9eSMarc Zyngier 	geo->cylinders = virtio_host_to_guest_u16(&bdev->vdev, geo->cylinders);
17101dafc9eSMarc Zyngier 
17201dafc9eSMarc Zyngier 	conf->blk_size = virtio_host_to_guest_u32(&bdev->vdev, conf->blk_size);
17301dafc9eSMarc Zyngier 	conf->min_io_size = virtio_host_to_guest_u16(&bdev->vdev, conf->min_io_size);
17401dafc9eSMarc Zyngier 	conf->opt_io_size = virtio_host_to_guest_u32(&bdev->vdev, conf->opt_io_size);
175427948d5SSasha Levin }
176427948d5SSasha Levin 
177*95242e44SJean-Philippe Brucker static void notify_status(struct kvm *kvm, void *dev, u32 status)
178*95242e44SJean-Philippe Brucker {
179*95242e44SJean-Philippe Brucker }
180*95242e44SJean-Philippe Brucker 
181c59ba304SWill Deacon static int init_vq(struct kvm *kvm, void *dev, u32 vq, u32 page_size, u32 align,
182c59ba304SWill Deacon 		   u32 pfn)
183427948d5SSasha Levin {
184427948d5SSasha Levin 	struct blk_dev *bdev = dev;
185427948d5SSasha Levin 	struct virt_queue *queue;
186427948d5SSasha Levin 	void *p;
187427948d5SSasha Levin 
188312c62d1SSasha Levin 	compat__remove_message(compat_id);
189427948d5SSasha Levin 
190427948d5SSasha Levin 	queue		= &bdev->vqs[vq];
191427948d5SSasha Levin 	queue->pfn	= pfn;
192e7e2950aSSasha Levin 	p		= virtio_get_vq(kvm, queue->pfn, page_size);
193427948d5SSasha Levin 
194c59ba304SWill Deacon 	vring_init(&queue->vring, VIRTIO_BLK_QUEUE_SIZE, p, align);
19501dafc9eSMarc Zyngier 	virtio_init_device_vq(&bdev->vdev, queue);
196427948d5SSasha Levin 
197427948d5SSasha Levin 	return 0;
198427948d5SSasha Levin }
199427948d5SSasha Levin 
2005ac1178bSAsias He static void *virtio_blk_thread(void *dev)
2015ac1178bSAsias He {
2025ac1178bSAsias He 	struct blk_dev *bdev = dev;
2035ac1178bSAsias He 	u64 data;
204a7aa454eSSasha Levin 	int r;
2055ac1178bSAsias He 
206a4d8c55eSSasha Levin 	kvm__set_thread_name("virtio-blk-io");
207a4d8c55eSSasha Levin 
2085ac1178bSAsias He 	while (1) {
209a7aa454eSSasha Levin 		r = read(bdev->io_efd, &data, sizeof(u64));
210a7aa454eSSasha Levin 		if (r < 0)
211a7aa454eSSasha Levin 			continue;
2125ac1178bSAsias He 		virtio_blk_do_io(bdev->kvm, &bdev->vqs[0], bdev);
2135ac1178bSAsias He 	}
2145ac1178bSAsias He 
2155ac1178bSAsias He 	pthread_exit(NULL);
2165ac1178bSAsias He 	return NULL;
2175ac1178bSAsias He }
2185ac1178bSAsias He 
219427948d5SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq)
220427948d5SSasha Levin {
221427948d5SSasha Levin 	struct blk_dev *bdev = dev;
2225ac1178bSAsias He 	u64 data = 1;
223a7aa454eSSasha Levin 	int r;
224427948d5SSasha Levin 
225a7aa454eSSasha Levin 	r = write(bdev->io_efd, &data, sizeof(data));
226a7aa454eSSasha Levin 	if (r < 0)
227a7aa454eSSasha Levin 		return r;
228427948d5SSasha Levin 
229427948d5SSasha Levin 	return 0;
230427948d5SSasha Levin }
231427948d5SSasha Levin 
232427948d5SSasha Levin static int get_pfn_vq(struct kvm *kvm, void *dev, u32 vq)
233427948d5SSasha Levin {
234427948d5SSasha Levin 	struct blk_dev *bdev = dev;
235427948d5SSasha Levin 
236427948d5SSasha Levin 	return bdev->vqs[vq].pfn;
237427948d5SSasha Levin }
238427948d5SSasha Levin 
239427948d5SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq)
240427948d5SSasha Levin {
241ffcc904aSAsias He 	/* FIXME: dynamic */
242427948d5SSasha Levin 	return VIRTIO_BLK_QUEUE_SIZE;
243427948d5SSasha Levin }
244427948d5SSasha Levin 
245ffcc904aSAsias He static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size)
246ffcc904aSAsias He {
247ffcc904aSAsias He 	/* FIXME: dynamic */
248ffcc904aSAsias He 	return size;
249ffcc904aSAsias He }
250ffcc904aSAsias He 
25115542babSAndre Przywara static struct virtio_ops blk_dev_virtio_ops = {
2521c47ce69SSasha Levin 	.get_config		= get_config,
2531c47ce69SSasha Levin 	.get_host_features	= get_host_features,
2541c47ce69SSasha Levin 	.set_guest_features	= set_guest_features,
2551c47ce69SSasha Levin 	.init_vq		= init_vq,
256*95242e44SJean-Philippe Brucker 	.notify_status		= notify_status,
2571c47ce69SSasha Levin 	.notify_vq		= notify_vq,
2581c47ce69SSasha Levin 	.get_pfn_vq		= get_pfn_vq,
2591c47ce69SSasha Levin 	.get_size_vq		= get_size_vq,
260ffcc904aSAsias He 	.set_size_vq		= set_size_vq,
2611c47ce69SSasha Levin };
2621c47ce69SSasha Levin 
2639f9207c5SSasha Levin static int virtio_blk__init_one(struct kvm *kvm, struct disk_image *disk)
2644749e795SSasha Levin {
265fe2a70d1SSasha Levin 	struct blk_dev *bdev;
2662fddfdb5SAsias He 	unsigned int i;
2674749e795SSasha Levin 
2684749e795SSasha Levin 	if (!disk)
2699f9207c5SSasha Levin 		return -EINVAL;
2704749e795SSasha Levin 
271ebe9ac19SSasha Levin 	bdev = calloc(1, sizeof(struct blk_dev));
272ebe9ac19SSasha Levin 	if (bdev == NULL)
2739f9207c5SSasha Levin 		return -ENOMEM;
2744749e795SSasha Levin 
275fe2a70d1SSasha Levin 	*bdev = (struct blk_dev) {
276d3476f7dSSasha Levin 		.mutex			= MUTEX_INITIALIZER,
2774749e795SSasha Levin 		.disk			= disk,
2784749e795SSasha Levin 		.blk_config		= (struct virtio_blk_config) {
2794749e795SSasha Levin 			.capacity	= disk->size / SECTOR_SIZE,
2803d7831a1SAsias He 			.seg_max	= DISK_SEG_MAX,
2814749e795SSasha Levin 		},
2825ac1178bSAsias He 		.io_efd			= eventfd(0, 0),
2835ac1178bSAsias He 		.kvm			= kvm,
284427948d5SSasha Levin 	};
285427948d5SSasha Levin 
28602eca50cSAsias He 	virtio_init(kvm, bdev, &bdev->vdev, &blk_dev_virtio_ops,
287d97dadecSWill Deacon 		    VIRTIO_DEFAULT_TRANS(kvm), PCI_DEVICE_ID_VIRTIO_BLK,
288ae06ce71SWill Deacon 		    VIRTIO_ID_BLOCK, PCI_CLASS_BLK);
289b30d05adSPekka Enberg 
290ebe9ac19SSasha Levin 	list_add_tail(&bdev->list, &bdevs);
291ebe9ac19SSasha Levin 
2922fddfdb5SAsias He 	for (i = 0; i < ARRAY_SIZE(bdev->reqs); i++) {
2932fddfdb5SAsias He 		bdev->reqs[i].bdev = bdev;
2942fddfdb5SAsias He 		bdev->reqs[i].kvm = kvm;
2952fddfdb5SAsias He 	}
2968b52f877SSasha Levin 
297fb434ac3SSasha Levin 	disk_image__set_callback(bdev->disk, virtio_blk_complete);
298fb434ac3SSasha Levin 
2995ac1178bSAsias He 	pthread_create(&bdev->io_thread, NULL, virtio_blk_thread, bdev);
300d278197dSAsias He 	if (compat_id == -1)
30152f34d2cSAsias He 		compat_id = virtio_compat_add_message("virtio-blk", "CONFIG_VIRTIO_BLK");
3025ac1178bSAsias He 
3039f9207c5SSasha Levin 	return 0;
304b30d05adSPekka Enberg }
305bcb6aacaSPrasad Joshi 
3069f9207c5SSasha Levin static int virtio_blk__exit_one(struct kvm *kvm, struct blk_dev *bdev)
307bcb6aacaSPrasad Joshi {
3089f9207c5SSasha Levin 	list_del(&bdev->list);
3099f9207c5SSasha Levin 	free(bdev);
310bcb6aacaSPrasad Joshi 
3119f9207c5SSasha Levin 	return 0;
312bcb6aacaSPrasad Joshi }
313a0a1e3c2SPrasad Joshi 
3149f9207c5SSasha Levin int virtio_blk__init(struct kvm *kvm)
3159f9207c5SSasha Levin {
3169f9207c5SSasha Levin 	int i, r = 0;
3179f9207c5SSasha Levin 
3189f9207c5SSasha Levin 	for (i = 0; i < kvm->nr_disks; i++) {
319a67da3beSAsias He 		if (kvm->disks[i]->wwpn)
320a67da3beSAsias He 			continue;
3219f9207c5SSasha Levin 		r = virtio_blk__init_one(kvm, kvm->disks[i]);
3229f9207c5SSasha Levin 		if (r < 0)
3239f9207c5SSasha Levin 			goto cleanup;
3249f9207c5SSasha Levin 	}
3259f9207c5SSasha Levin 
3269f9207c5SSasha Levin 	return 0;
3279f9207c5SSasha Levin cleanup:
3289f9207c5SSasha Levin 	return virtio_blk__exit(kvm);
3299f9207c5SSasha Levin }
33049a8afd1SSasha Levin virtio_dev_init(virtio_blk__init);
3319f9207c5SSasha Levin 
3329f9207c5SSasha Levin int virtio_blk__exit(struct kvm *kvm)
333a0a1e3c2SPrasad Joshi {
334ebe9ac19SSasha Levin 	while (!list_empty(&bdevs)) {
335ebe9ac19SSasha Levin 		struct blk_dev *bdev;
336a0a1e3c2SPrasad Joshi 
337ebe9ac19SSasha Levin 		bdev = list_first_entry(&bdevs, struct blk_dev, list);
3389f9207c5SSasha Levin 		virtio_blk__exit_one(kvm, bdev);
339ebe9ac19SSasha Levin 	}
3409f9207c5SSasha Levin 
3419f9207c5SSasha Levin 	return 0;
342a0a1e3c2SPrasad Joshi }
34349a8afd1SSasha Levin virtio_dev_exit(virtio_blk__exit);
344