xref: /kvmtool/virtio/vsock.c (revision f84ab9eb74fcd7db332c5b915c7d60cae44f8958)
#include "kvm/virtio-vsock.h"
#include "kvm/virtio-pci-dev.h"
#include "kvm/kvm.h"
#include "kvm/pci.h"
#include "kvm/ioeventfd.h"
#include "kvm/guest_compat.h"
#include "kvm/virtio-pci.h"
#include "kvm/virtio.h"

#include <linux/byteorder.h>
#include <linux/kernel.h>
#include <linux/virtio_vsock.h>
#include <linux/vhost.h>

#include <unistd.h>
14117d6495STianjia Zhang 
/* Ring size reported for, and used to initialise, every vsock virtqueue. */
#define VIRTIO_VSOCK_QUEUE_SIZE		128

/* All vsock devices created by this file, linked through vsock_dev::list. */
static LIST_HEAD(vdevs);

/*
 * Id of the "virtio-vsock" compat message; -1 until the message has been
 * registered by virtio_vsock_init_one().
 */
static int compat_id = -1;
19117d6495STianjia Zhang 
/* Indices of the virtqueues of a vsock device. */
enum {
	/* for host to guest data */
	VSOCK_VQ_RX     = 0,
	/* for guest to host data */
	VSOCK_VQ_TX     = 1,
	/* event queue; never handed to vhost by the callbacks in this file */
	VSOCK_VQ_EVENT  = 2,
	/* number of queues, used to size vsock_dev::vqs */
	VSOCK_VQ_MAX    = 3,
};
26117d6495STianjia Zhang 
27117d6495STianjia Zhang struct vsock_dev {
28117d6495STianjia Zhang 	struct virt_queue		vqs[VSOCK_VQ_MAX];
29117d6495STianjia Zhang 	struct virtio_vsock_config	config;
30867b15ccSJean-Philippe Brucker 	u64				guest_cid;
31117d6495STianjia Zhang 	u32				features;
32117d6495STianjia Zhang 	int				vhost_fd;
33117d6495STianjia Zhang 	struct virtio_device		vdev;
34117d6495STianjia Zhang 	struct list_head		list;
35117d6495STianjia Zhang 	struct kvm			*kvm;
36117d6495STianjia Zhang };
37117d6495STianjia Zhang 
38117d6495STianjia Zhang static u8 *get_config(struct kvm *kvm, void *dev)
39117d6495STianjia Zhang {
40117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
41117d6495STianjia Zhang 
42117d6495STianjia Zhang 	return ((u8 *)(&vdev->config));
43117d6495STianjia Zhang }
44117d6495STianjia Zhang 
45e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev)
46e4730284SMartin Radev {
47e4730284SMartin Radev 	struct vsock_dev *vdev = dev;
48e4730284SMartin Radev 
49e4730284SMartin Radev 	return sizeof(vdev->config);
50e4730284SMartin Radev }
51e4730284SMartin Radev 
523c8f82b8SJean-Philippe Brucker static u64 get_host_features(struct kvm *kvm, void *dev)
53117d6495STianjia Zhang {
54117d6495STianjia Zhang 	return 1UL << VIRTIO_RING_F_EVENT_IDX
55117d6495STianjia Zhang 		| 1UL << VIRTIO_RING_F_INDIRECT_DESC;
56117d6495STianjia Zhang }
57117d6495STianjia Zhang 
58117d6495STianjia Zhang static bool is_event_vq(u32 vq)
59117d6495STianjia Zhang {
60117d6495STianjia Zhang 	return vq == VSOCK_VQ_EVENT;
61117d6495STianjia Zhang }
62117d6495STianjia Zhang 
63609ee906SJean-Philippe Brucker static int init_vq(struct kvm *kvm, void *dev, u32 vq)
64117d6495STianjia Zhang {
65117d6495STianjia Zhang 	struct vhost_vring_state state = { .index = vq };
66117d6495STianjia Zhang 	struct vhost_vring_addr addr;
67117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
68117d6495STianjia Zhang 	struct virt_queue *queue;
69117d6495STianjia Zhang 	int r;
70117d6495STianjia Zhang 
71117d6495STianjia Zhang 	compat__remove_message(compat_id);
72117d6495STianjia Zhang 
73117d6495STianjia Zhang 	queue		= &vdev->vqs[vq];
74609ee906SJean-Philippe Brucker 	virtio_init_device_vq(kvm, &vdev->vdev, queue, VIRTIO_VSOCK_QUEUE_SIZE);
75117d6495STianjia Zhang 
76117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
77117d6495STianjia Zhang 		return 0;
78117d6495STianjia Zhang 
79117d6495STianjia Zhang 	if (is_event_vq(vq))
80117d6495STianjia Zhang 		return 0;
81117d6495STianjia Zhang 
82117d6495STianjia Zhang 	state.num = queue->vring.num;
83117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_NUM, &state);
84117d6495STianjia Zhang 	if (r < 0)
85117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_NUM failed");
86117d6495STianjia Zhang 
87117d6495STianjia Zhang 	state.num = 0;
88117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_BASE, &state);
89117d6495STianjia Zhang 	if (r < 0)
90117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_BASE failed");
91117d6495STianjia Zhang 
92117d6495STianjia Zhang 	addr = (struct vhost_vring_addr) {
93117d6495STianjia Zhang 		.index = vq,
94117d6495STianjia Zhang 		.desc_user_addr = (u64)(unsigned long)queue->vring.desc,
95117d6495STianjia Zhang 		.avail_user_addr = (u64)(unsigned long)queue->vring.avail,
96117d6495STianjia Zhang 		.used_user_addr = (u64)(unsigned long)queue->vring.used,
97117d6495STianjia Zhang 	};
98117d6495STianjia Zhang 
99117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_ADDR, &addr);
100117d6495STianjia Zhang 	if (r < 0)
101117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_ADDR failed");
102117d6495STianjia Zhang 
103117d6495STianjia Zhang 	return 0;
104117d6495STianjia Zhang }
105117d6495STianjia Zhang 
106117d6495STianjia Zhang static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd)
107117d6495STianjia Zhang {
108117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
109117d6495STianjia Zhang 	struct vhost_vring_file file = {
110117d6495STianjia Zhang 		.index	= vq,
111117d6495STianjia Zhang 		.fd	= efd,
112117d6495STianjia Zhang 	};
113117d6495STianjia Zhang 	int r;
114117d6495STianjia Zhang 
115117d6495STianjia Zhang 	if (is_event_vq(vq))
116117d6495STianjia Zhang 		return;
117117d6495STianjia Zhang 
118117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
119117d6495STianjia Zhang 		return;
120117d6495STianjia Zhang 
121117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_KICK, &file);
122117d6495STianjia Zhang 	if (r < 0)
123117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_KICK failed");
124117d6495STianjia Zhang }
125117d6495STianjia Zhang 
126117d6495STianjia Zhang static void notify_status(struct kvm *kvm, void *dev, u32 status)
127117d6495STianjia Zhang {
128117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
129117d6495STianjia Zhang 	int r, start;
130117d6495STianjia Zhang 
131867b15ccSJean-Philippe Brucker 	if (status & VIRTIO__STATUS_CONFIG)
132867b15ccSJean-Philippe Brucker 		vdev->config.guest_cid = cpu_to_le64(vdev->guest_cid);
133867b15ccSJean-Philippe Brucker 
134a8e397bbSJean-Philippe Brucker 	if (status & VIRTIO__STATUS_START)
135a8e397bbSJean-Philippe Brucker 		start = 1;
136a8e397bbSJean-Philippe Brucker 	else if (status & VIRTIO__STATUS_STOP)
137a8e397bbSJean-Philippe Brucker 		start = 0;
138a8e397bbSJean-Philippe Brucker 	else
139117d6495STianjia Zhang 		return;
140117d6495STianjia Zhang 
141117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_RUNNING, &start);
142117d6495STianjia Zhang 	if (r != 0)
143117d6495STianjia Zhang 		die("VHOST_VSOCK_SET_RUNNING failed %d", errno);
144117d6495STianjia Zhang }
145117d6495STianjia Zhang 
146117d6495STianjia Zhang static int notify_vq(struct kvm *kvm, void *dev, u32 vq)
147117d6495STianjia Zhang {
148117d6495STianjia Zhang 	return 0;
149117d6495STianjia Zhang }
150117d6495STianjia Zhang 
151117d6495STianjia Zhang static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq)
152117d6495STianjia Zhang {
153117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
154117d6495STianjia Zhang 
155117d6495STianjia Zhang 	return &vdev->vqs[vq];
156117d6495STianjia Zhang }
157117d6495STianjia Zhang 
158117d6495STianjia Zhang static int get_size_vq(struct kvm *kvm, void *dev, u32 vq)
159117d6495STianjia Zhang {
160117d6495STianjia Zhang 	return VIRTIO_VSOCK_QUEUE_SIZE;
161117d6495STianjia Zhang }
162117d6495STianjia Zhang 
163117d6495STianjia Zhang static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size)
164117d6495STianjia Zhang {
165117d6495STianjia Zhang 	return size;
166117d6495STianjia Zhang }
167117d6495STianjia Zhang 
168117d6495STianjia Zhang static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi)
169117d6495STianjia Zhang {
170117d6495STianjia Zhang 	struct vhost_vring_file file;
171117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
172117d6495STianjia Zhang 	struct kvm_irqfd irq;
173117d6495STianjia Zhang 	int r;
174117d6495STianjia Zhang 
175117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
176117d6495STianjia Zhang 		return;
177117d6495STianjia Zhang 
178117d6495STianjia Zhang 	if (is_event_vq(vq))
179117d6495STianjia Zhang 		return;
180117d6495STianjia Zhang 
181117d6495STianjia Zhang 	irq = (struct kvm_irqfd) {
182117d6495STianjia Zhang 		.gsi	= gsi,
183117d6495STianjia Zhang 		.fd	= eventfd(0, 0),
184117d6495STianjia Zhang 	};
185117d6495STianjia Zhang 	file = (struct vhost_vring_file) {
186117d6495STianjia Zhang 		.index	= vq,
187117d6495STianjia Zhang 		.fd	= irq.fd,
188117d6495STianjia Zhang 	};
189117d6495STianjia Zhang 
190117d6495STianjia Zhang 	r = ioctl(kvm->vm_fd, KVM_IRQFD, &irq);
191117d6495STianjia Zhang 	if (r < 0)
192117d6495STianjia Zhang 		die_perror("KVM_IRQFD failed");
193117d6495STianjia Zhang 
194117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_CALL, &file);
195117d6495STianjia Zhang 	if (r < 0)
196117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_CALL failed");
197117d6495STianjia Zhang }
198117d6495STianjia Zhang 
19931e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev)
200117d6495STianjia Zhang {
201117d6495STianjia Zhang 	return VSOCK_VQ_MAX;
202117d6495STianjia Zhang }
203117d6495STianjia Zhang 
204117d6495STianjia Zhang static struct virtio_ops vsock_dev_virtio_ops = {
205117d6495STianjia Zhang 	.get_config		= get_config,
206e4730284SMartin Radev 	.get_config_size	= get_config_size,
207117d6495STianjia Zhang 	.get_host_features	= get_host_features,
208117d6495STianjia Zhang 	.init_vq		= init_vq,
209117d6495STianjia Zhang 	.get_vq			= get_vq,
210117d6495STianjia Zhang 	.get_size_vq		= get_size_vq,
211117d6495STianjia Zhang 	.set_size_vq		= set_size_vq,
212117d6495STianjia Zhang 	.notify_vq_eventfd	= notify_vq_eventfd,
213117d6495STianjia Zhang 	.notify_status		= notify_status,
214117d6495STianjia Zhang 	.notify_vq_gsi		= notify_vq_gsi,
215117d6495STianjia Zhang 	.notify_vq		= notify_vq,
216117d6495STianjia Zhang 	.get_vq_count		= get_vq_count,
217117d6495STianjia Zhang };
218117d6495STianjia Zhang 
219117d6495STianjia Zhang static void virtio_vhost_vsock_init(struct kvm *kvm, struct vsock_dev *vdev)
220117d6495STianjia Zhang {
221117d6495STianjia Zhang 	u64 features;
222*f84ab9ebSJean-Philippe Brucker 	int r;
223117d6495STianjia Zhang 
224117d6495STianjia Zhang 	vdev->vhost_fd = open("/dev/vhost-vsock", O_RDWR);
225117d6495STianjia Zhang 	if (vdev->vhost_fd < 0)
226117d6495STianjia Zhang 		die_perror("Failed opening vhost-vsock device");
227117d6495STianjia Zhang 
228*f84ab9ebSJean-Philippe Brucker 	virtio_vhost_init(kvm, vdev->vhost_fd);
229117d6495STianjia Zhang 
230117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_GET_FEATURES, &features);
231117d6495STianjia Zhang 	if (r != 0)
232117d6495STianjia Zhang 		die_perror("VHOST_GET_FEATURES failed");
233117d6495STianjia Zhang 
234117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_FEATURES, &features);
235117d6495STianjia Zhang 	if (r != 0)
236117d6495STianjia Zhang 		die_perror("VHOST_SET_FEATURES failed");
237117d6495STianjia Zhang 
238867b15ccSJean-Philippe Brucker 	r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_GUEST_CID, &vdev->guest_cid);
239117d6495STianjia Zhang 	if (r != 0)
240117d6495STianjia Zhang 		die_perror("VHOST_VSOCK_SET_GUEST_CID failed");
241117d6495STianjia Zhang 
242117d6495STianjia Zhang 	vdev->vdev.use_vhost = true;
243117d6495STianjia Zhang }
244117d6495STianjia Zhang 
245117d6495STianjia Zhang static int virtio_vsock_init_one(struct kvm *kvm, u64 guest_cid)
246117d6495STianjia Zhang {
247117d6495STianjia Zhang 	struct vsock_dev *vdev;
248117d6495STianjia Zhang 	int r;
249117d6495STianjia Zhang 
250117d6495STianjia Zhang 	vdev = calloc(1, sizeof(struct vsock_dev));
251117d6495STianjia Zhang 	if (vdev == NULL)
252117d6495STianjia Zhang 		return -ENOMEM;
253117d6495STianjia Zhang 
254117d6495STianjia Zhang 	*vdev = (struct vsock_dev) {
255117d6495STianjia Zhang 		.guest_cid		= guest_cid,
256117d6495STianjia Zhang 		.vhost_fd		= -1,
257117d6495STianjia Zhang 		.kvm			= kvm,
258117d6495STianjia Zhang 	};
259117d6495STianjia Zhang 
260117d6495STianjia Zhang 	list_add_tail(&vdev->list, &vdevs);
261117d6495STianjia Zhang 
262117d6495STianjia Zhang 	r = virtio_init(kvm, vdev, &vdev->vdev, &vsock_dev_virtio_ops,
2639b46ebc5SRajnesh Kanwal 		    kvm->cfg.virtio_transport, PCI_DEVICE_ID_VIRTIO_VSOCK,
264117d6495STianjia Zhang 		    VIRTIO_ID_VSOCK, PCI_CLASS_VSOCK);
265117d6495STianjia Zhang 	if (r < 0)
266117d6495STianjia Zhang 	    return r;
267117d6495STianjia Zhang 
268117d6495STianjia Zhang 	virtio_vhost_vsock_init(kvm, vdev);
269117d6495STianjia Zhang 
270117d6495STianjia Zhang 	if (compat_id == -1)
271117d6495STianjia Zhang 		compat_id = virtio_compat_add_message("virtio-vsock", "CONFIG_VIRTIO_VSOCK");
272117d6495STianjia Zhang 
273117d6495STianjia Zhang 	return 0;
274117d6495STianjia Zhang }
275117d6495STianjia Zhang 
276117d6495STianjia Zhang static int virtio_vsock_exit_one(struct kvm *kvm, struct vsock_dev *vdev)
277117d6495STianjia Zhang {
278117d6495STianjia Zhang 	list_del(&vdev->list);
279117d6495STianjia Zhang 	free(vdev);
280117d6495STianjia Zhang 
281117d6495STianjia Zhang 	return 0;
282117d6495STianjia Zhang }
283117d6495STianjia Zhang 
284117d6495STianjia Zhang int virtio_vsock_init(struct kvm *kvm)
285117d6495STianjia Zhang {
286117d6495STianjia Zhang 	int r;
287117d6495STianjia Zhang 
288117d6495STianjia Zhang 	if (kvm->cfg.vsock_cid == 0)
289117d6495STianjia Zhang 		return 0;
290117d6495STianjia Zhang 
291117d6495STianjia Zhang 	r = virtio_vsock_init_one(kvm, kvm->cfg.vsock_cid);
292117d6495STianjia Zhang 	if (r < 0)
293117d6495STianjia Zhang 		goto cleanup;
294117d6495STianjia Zhang 
295117d6495STianjia Zhang 	return 0;
296117d6495STianjia Zhang cleanup:
297117d6495STianjia Zhang 	return virtio_vsock_exit(kvm);
298117d6495STianjia Zhang }
299117d6495STianjia Zhang virtio_dev_init(virtio_vsock_init);
300117d6495STianjia Zhang 
301117d6495STianjia Zhang int virtio_vsock_exit(struct kvm *kvm)
302117d6495STianjia Zhang {
303117d6495STianjia Zhang 	while (!list_empty(&vdevs)) {
304117d6495STianjia Zhang 		struct vsock_dev *vdev;
305117d6495STianjia Zhang 
306117d6495STianjia Zhang 		vdev = list_first_entry(&vdevs, struct vsock_dev, list);
307117d6495STianjia Zhang 		virtio_vsock_exit_one(kvm, vdev);
308117d6495STianjia Zhang 	}
309117d6495STianjia Zhang 
310117d6495STianjia Zhang 	return 0;
311117d6495STianjia Zhang }
312117d6495STianjia Zhang virtio_dev_exit(virtio_vsock_exit);
313