xref: /kvmtool/virtio/vsock.c (revision 609ee9066879f2ff7138c825588a4bc5d2f83658)
#include "kvm/virtio-vsock.h"
#include "kvm/virtio-pci-dev.h"
#include "kvm/kvm.h"
#include "kvm/pci.h"
#include "kvm/ioeventfd.h"
#include "kvm/guest_compat.h"
#include "kvm/virtio-pci.h"
#include "kvm/virtio.h"

#include <linux/kernel.h>
#include <linux/virtio_vsock.h>
#include <linux/vhost.h>

#include <unistd.h>
13117d6495STianjia Zhang 
/* Ring size used for every vsock virtqueue (see init_vq/get_size_vq). */
#define VIRTIO_VSOCK_QUEUE_SIZE		128

/* All vsock devices created by virtio_vsock_init_one(). */
static LIST_HEAD(vdevs);
/* Id of the registered compat message; -1 while none has been added. */
static int compat_id = -1;
18117d6495STianjia Zhang 
/* Indices of the vsock virtqueues inside vsock_dev::vqs. */
enum {
	VSOCK_VQ_RX,	/* 0: for host to guest data */
	VSOCK_VQ_TX,	/* 1: for guest to host data */
	VSOCK_VQ_EVENT,	/* 2: event queue, skipped by the vhost setup below */
	VSOCK_VQ_MAX,	/* 3: number of queues, used to size the vqs array */
};
25117d6495STianjia Zhang 
26117d6495STianjia Zhang struct vsock_dev {
27117d6495STianjia Zhang 	struct virt_queue		vqs[VSOCK_VQ_MAX];
28117d6495STianjia Zhang 	struct virtio_vsock_config	config;
29117d6495STianjia Zhang 	u32				features;
30117d6495STianjia Zhang 	int				vhost_fd;
31117d6495STianjia Zhang 	struct virtio_device		vdev;
32117d6495STianjia Zhang 	struct list_head		list;
33117d6495STianjia Zhang 	struct kvm			*kvm;
34117d6495STianjia Zhang };
35117d6495STianjia Zhang 
36117d6495STianjia Zhang static u8 *get_config(struct kvm *kvm, void *dev)
37117d6495STianjia Zhang {
38117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
39117d6495STianjia Zhang 
40117d6495STianjia Zhang 	return ((u8 *)(&vdev->config));
41117d6495STianjia Zhang }
42117d6495STianjia Zhang 
43e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev)
44e4730284SMartin Radev {
45e4730284SMartin Radev 	struct vsock_dev *vdev = dev;
46e4730284SMartin Radev 
47e4730284SMartin Radev 	return sizeof(vdev->config);
48e4730284SMartin Radev }
49e4730284SMartin Radev 
50117d6495STianjia Zhang static u32 get_host_features(struct kvm *kvm, void *dev)
51117d6495STianjia Zhang {
52117d6495STianjia Zhang 	return 1UL << VIRTIO_RING_F_EVENT_IDX
53117d6495STianjia Zhang 		| 1UL << VIRTIO_RING_F_INDIRECT_DESC;
54117d6495STianjia Zhang }
55117d6495STianjia Zhang 
56117d6495STianjia Zhang static void set_guest_features(struct kvm *kvm, void *dev, u32 features)
57117d6495STianjia Zhang {
58117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
59117d6495STianjia Zhang 
60117d6495STianjia Zhang 	vdev->features = features;
61117d6495STianjia Zhang }
62117d6495STianjia Zhang 
63117d6495STianjia Zhang static bool is_event_vq(u32 vq)
64117d6495STianjia Zhang {
65117d6495STianjia Zhang 	return vq == VSOCK_VQ_EVENT;
66117d6495STianjia Zhang }
67117d6495STianjia Zhang 
68*609ee906SJean-Philippe Brucker static int init_vq(struct kvm *kvm, void *dev, u32 vq)
69117d6495STianjia Zhang {
70117d6495STianjia Zhang 	struct vhost_vring_state state = { .index = vq };
71117d6495STianjia Zhang 	struct vhost_vring_addr addr;
72117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
73117d6495STianjia Zhang 	struct virt_queue *queue;
74117d6495STianjia Zhang 	int r;
75117d6495STianjia Zhang 
76117d6495STianjia Zhang 	compat__remove_message(compat_id);
77117d6495STianjia Zhang 
78117d6495STianjia Zhang 	queue		= &vdev->vqs[vq];
79*609ee906SJean-Philippe Brucker 	virtio_init_device_vq(kvm, &vdev->vdev, queue, VIRTIO_VSOCK_QUEUE_SIZE);
80117d6495STianjia Zhang 
81117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
82117d6495STianjia Zhang 		return 0;
83117d6495STianjia Zhang 
84117d6495STianjia Zhang 	if (is_event_vq(vq))
85117d6495STianjia Zhang 		return 0;
86117d6495STianjia Zhang 
87117d6495STianjia Zhang 	state.num = queue->vring.num;
88117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_NUM, &state);
89117d6495STianjia Zhang 	if (r < 0)
90117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_NUM failed");
91117d6495STianjia Zhang 
92117d6495STianjia Zhang 	state.num = 0;
93117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_BASE, &state);
94117d6495STianjia Zhang 	if (r < 0)
95117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_BASE failed");
96117d6495STianjia Zhang 
97117d6495STianjia Zhang 	addr = (struct vhost_vring_addr) {
98117d6495STianjia Zhang 		.index = vq,
99117d6495STianjia Zhang 		.desc_user_addr = (u64)(unsigned long)queue->vring.desc,
100117d6495STianjia Zhang 		.avail_user_addr = (u64)(unsigned long)queue->vring.avail,
101117d6495STianjia Zhang 		.used_user_addr = (u64)(unsigned long)queue->vring.used,
102117d6495STianjia Zhang 	};
103117d6495STianjia Zhang 
104117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_ADDR, &addr);
105117d6495STianjia Zhang 	if (r < 0)
106117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_ADDR failed");
107117d6495STianjia Zhang 
108117d6495STianjia Zhang 	return 0;
109117d6495STianjia Zhang }
110117d6495STianjia Zhang 
111117d6495STianjia Zhang static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd)
112117d6495STianjia Zhang {
113117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
114117d6495STianjia Zhang 	struct vhost_vring_file file = {
115117d6495STianjia Zhang 		.index	= vq,
116117d6495STianjia Zhang 		.fd	= efd,
117117d6495STianjia Zhang 	};
118117d6495STianjia Zhang 	int r;
119117d6495STianjia Zhang 
120117d6495STianjia Zhang 	if (is_event_vq(vq))
121117d6495STianjia Zhang 		return;
122117d6495STianjia Zhang 
123117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
124117d6495STianjia Zhang 		return;
125117d6495STianjia Zhang 
126117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_KICK, &file);
127117d6495STianjia Zhang 	if (r < 0)
128117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_KICK failed");
129117d6495STianjia Zhang }
130117d6495STianjia Zhang 
131117d6495STianjia Zhang static void notify_status(struct kvm *kvm, void *dev, u32 status)
132117d6495STianjia Zhang {
133117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
134117d6495STianjia Zhang 	int r, start;
135117d6495STianjia Zhang 
136a8e397bbSJean-Philippe Brucker 	if (status & VIRTIO__STATUS_START)
137a8e397bbSJean-Philippe Brucker 		start = 1;
138a8e397bbSJean-Philippe Brucker 	else if (status & VIRTIO__STATUS_STOP)
139a8e397bbSJean-Philippe Brucker 		start = 0;
140a8e397bbSJean-Philippe Brucker 	else
141117d6495STianjia Zhang 		return;
142117d6495STianjia Zhang 
143117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_RUNNING, &start);
144117d6495STianjia Zhang 	if (r != 0)
145117d6495STianjia Zhang 		die("VHOST_VSOCK_SET_RUNNING failed %d", errno);
146117d6495STianjia Zhang }
147117d6495STianjia Zhang 
148117d6495STianjia Zhang static int notify_vq(struct kvm *kvm, void *dev, u32 vq)
149117d6495STianjia Zhang {
150117d6495STianjia Zhang 	return 0;
151117d6495STianjia Zhang }
152117d6495STianjia Zhang 
153117d6495STianjia Zhang static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq)
154117d6495STianjia Zhang {
155117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
156117d6495STianjia Zhang 
157117d6495STianjia Zhang 	return &vdev->vqs[vq];
158117d6495STianjia Zhang }
159117d6495STianjia Zhang 
160117d6495STianjia Zhang static int get_size_vq(struct kvm *kvm, void *dev, u32 vq)
161117d6495STianjia Zhang {
162117d6495STianjia Zhang 	return VIRTIO_VSOCK_QUEUE_SIZE;
163117d6495STianjia Zhang }
164117d6495STianjia Zhang 
165117d6495STianjia Zhang static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size)
166117d6495STianjia Zhang {
167117d6495STianjia Zhang 	return size;
168117d6495STianjia Zhang }
169117d6495STianjia Zhang 
170117d6495STianjia Zhang static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi)
171117d6495STianjia Zhang {
172117d6495STianjia Zhang 	struct vhost_vring_file file;
173117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
174117d6495STianjia Zhang 	struct kvm_irqfd irq;
175117d6495STianjia Zhang 	int r;
176117d6495STianjia Zhang 
177117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
178117d6495STianjia Zhang 		return;
179117d6495STianjia Zhang 
180117d6495STianjia Zhang 	if (is_event_vq(vq))
181117d6495STianjia Zhang 		return;
182117d6495STianjia Zhang 
183117d6495STianjia Zhang 	irq = (struct kvm_irqfd) {
184117d6495STianjia Zhang 		.gsi	= gsi,
185117d6495STianjia Zhang 		.fd	= eventfd(0, 0),
186117d6495STianjia Zhang 	};
187117d6495STianjia Zhang 	file = (struct vhost_vring_file) {
188117d6495STianjia Zhang 		.index	= vq,
189117d6495STianjia Zhang 		.fd	= irq.fd,
190117d6495STianjia Zhang 	};
191117d6495STianjia Zhang 
192117d6495STianjia Zhang 	r = ioctl(kvm->vm_fd, KVM_IRQFD, &irq);
193117d6495STianjia Zhang 	if (r < 0)
194117d6495STianjia Zhang 		die_perror("KVM_IRQFD failed");
195117d6495STianjia Zhang 
196117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_CALL, &file);
197117d6495STianjia Zhang 	if (r < 0)
198117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_CALL failed");
199117d6495STianjia Zhang }
200117d6495STianjia Zhang 
20131e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev)
202117d6495STianjia Zhang {
203117d6495STianjia Zhang 	return VSOCK_VQ_MAX;
204117d6495STianjia Zhang }
205117d6495STianjia Zhang 
206117d6495STianjia Zhang static struct virtio_ops vsock_dev_virtio_ops = {
207117d6495STianjia Zhang 	.get_config		= get_config,
208e4730284SMartin Radev 	.get_config_size	= get_config_size,
209117d6495STianjia Zhang 	.get_host_features	= get_host_features,
210117d6495STianjia Zhang 	.set_guest_features	= set_guest_features,
211117d6495STianjia Zhang 	.init_vq		= init_vq,
212117d6495STianjia Zhang 	.get_vq			= get_vq,
213117d6495STianjia Zhang 	.get_size_vq		= get_size_vq,
214117d6495STianjia Zhang 	.set_size_vq		= set_size_vq,
215117d6495STianjia Zhang 	.notify_vq_eventfd	= notify_vq_eventfd,
216117d6495STianjia Zhang 	.notify_status		= notify_status,
217117d6495STianjia Zhang 	.notify_vq_gsi		= notify_vq_gsi,
218117d6495STianjia Zhang 	.notify_vq		= notify_vq,
219117d6495STianjia Zhang 	.get_vq_count		= get_vq_count,
220117d6495STianjia Zhang };
221117d6495STianjia Zhang 
222117d6495STianjia Zhang static void virtio_vhost_vsock_init(struct kvm *kvm, struct vsock_dev *vdev)
223117d6495STianjia Zhang {
224117d6495STianjia Zhang 	struct kvm_mem_bank *bank;
225117d6495STianjia Zhang 	struct vhost_memory *mem;
226117d6495STianjia Zhang 	u64 features;
227117d6495STianjia Zhang 	int r, i;
228117d6495STianjia Zhang 
229117d6495STianjia Zhang 	vdev->vhost_fd = open("/dev/vhost-vsock", O_RDWR);
230117d6495STianjia Zhang 	if (vdev->vhost_fd < 0)
231117d6495STianjia Zhang 		die_perror("Failed opening vhost-vsock device");
232117d6495STianjia Zhang 
233117d6495STianjia Zhang 	mem = calloc(1, sizeof(*mem) + sizeof(struct vhost_memory_region));
234117d6495STianjia Zhang 	if (mem == NULL)
235117d6495STianjia Zhang 		die("Failed allocating memory for vhost memory map");
236117d6495STianjia Zhang 
237117d6495STianjia Zhang 	i = 0;
238117d6495STianjia Zhang 	list_for_each_entry(bank, &kvm->mem_banks, list) {
239117d6495STianjia Zhang 		mem->regions[i] = (struct vhost_memory_region) {
240117d6495STianjia Zhang 			.guest_phys_addr = bank->guest_phys_addr,
241117d6495STianjia Zhang 			.memory_size	 = bank->size,
242117d6495STianjia Zhang 			.userspace_addr	 = (unsigned long)bank->host_addr,
243117d6495STianjia Zhang 		};
244117d6495STianjia Zhang 		i++;
245117d6495STianjia Zhang 	}
246117d6495STianjia Zhang 	mem->nregions = i;
247117d6495STianjia Zhang 
248117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_OWNER);
249117d6495STianjia Zhang 	if (r != 0)
250117d6495STianjia Zhang 		die_perror("VHOST_SET_OWNER failed");
251117d6495STianjia Zhang 
252117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_MEM_TABLE, mem);
253117d6495STianjia Zhang 	if (r != 0)
254117d6495STianjia Zhang 		die_perror("VHOST_SET_MEM_TABLE failed");
255117d6495STianjia Zhang 
256117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_GET_FEATURES, &features);
257117d6495STianjia Zhang 	if (r != 0)
258117d6495STianjia Zhang 		die_perror("VHOST_GET_FEATURES failed");
259117d6495STianjia Zhang 
260117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_FEATURES, &features);
261117d6495STianjia Zhang 	if (r != 0)
262117d6495STianjia Zhang 		die_perror("VHOST_SET_FEATURES failed");
263117d6495STianjia Zhang 
264117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_GUEST_CID, &vdev->config.guest_cid);
265117d6495STianjia Zhang 	if (r != 0)
266117d6495STianjia Zhang 		die_perror("VHOST_VSOCK_SET_GUEST_CID failed");
267117d6495STianjia Zhang 
268117d6495STianjia Zhang 	vdev->vdev.use_vhost = true;
269117d6495STianjia Zhang 
270117d6495STianjia Zhang 	free(mem);
271117d6495STianjia Zhang }
272117d6495STianjia Zhang 
273117d6495STianjia Zhang static int virtio_vsock_init_one(struct kvm *kvm, u64 guest_cid)
274117d6495STianjia Zhang {
275117d6495STianjia Zhang 	struct vsock_dev *vdev;
276117d6495STianjia Zhang 	int r;
277117d6495STianjia Zhang 
278117d6495STianjia Zhang 	vdev = calloc(1, sizeof(struct vsock_dev));
279117d6495STianjia Zhang 	if (vdev == NULL)
280117d6495STianjia Zhang 		return -ENOMEM;
281117d6495STianjia Zhang 
282117d6495STianjia Zhang 	*vdev = (struct vsock_dev) {
283117d6495STianjia Zhang 		.config	= (struct virtio_vsock_config) {
284117d6495STianjia Zhang 			.guest_cid	= guest_cid,
285117d6495STianjia Zhang 		},
286117d6495STianjia Zhang 		.vhost_fd		= -1,
287117d6495STianjia Zhang 		.kvm			= kvm,
288117d6495STianjia Zhang 	};
289117d6495STianjia Zhang 
290117d6495STianjia Zhang 	list_add_tail(&vdev->list, &vdevs);
291117d6495STianjia Zhang 
292117d6495STianjia Zhang 	r = virtio_init(kvm, vdev, &vdev->vdev, &vsock_dev_virtio_ops,
293117d6495STianjia Zhang 		    VIRTIO_DEFAULT_TRANS(kvm), PCI_DEVICE_ID_VIRTIO_VSOCK,
294117d6495STianjia Zhang 		    VIRTIO_ID_VSOCK, PCI_CLASS_VSOCK);
295117d6495STianjia Zhang 	if (r < 0)
296117d6495STianjia Zhang 	    return r;
297117d6495STianjia Zhang 
298117d6495STianjia Zhang 	virtio_vhost_vsock_init(kvm, vdev);
299117d6495STianjia Zhang 
300117d6495STianjia Zhang 	if (compat_id == -1)
301117d6495STianjia Zhang 		compat_id = virtio_compat_add_message("virtio-vsock", "CONFIG_VIRTIO_VSOCK");
302117d6495STianjia Zhang 
303117d6495STianjia Zhang 	return 0;
304117d6495STianjia Zhang }
305117d6495STianjia Zhang 
306117d6495STianjia Zhang static int virtio_vsock_exit_one(struct kvm *kvm, struct vsock_dev *vdev)
307117d6495STianjia Zhang {
308117d6495STianjia Zhang 	list_del(&vdev->list);
309117d6495STianjia Zhang 	free(vdev);
310117d6495STianjia Zhang 
311117d6495STianjia Zhang 	return 0;
312117d6495STianjia Zhang }
313117d6495STianjia Zhang 
314117d6495STianjia Zhang int virtio_vsock_init(struct kvm *kvm)
315117d6495STianjia Zhang {
316117d6495STianjia Zhang 	int r;
317117d6495STianjia Zhang 
318117d6495STianjia Zhang 	if (kvm->cfg.vsock_cid == 0)
319117d6495STianjia Zhang 		return 0;
320117d6495STianjia Zhang 
321117d6495STianjia Zhang 	r = virtio_vsock_init_one(kvm, kvm->cfg.vsock_cid);
322117d6495STianjia Zhang 	if (r < 0)
323117d6495STianjia Zhang 		goto cleanup;
324117d6495STianjia Zhang 
325117d6495STianjia Zhang 	return 0;
326117d6495STianjia Zhang cleanup:
327117d6495STianjia Zhang 	return virtio_vsock_exit(kvm);
328117d6495STianjia Zhang }
329117d6495STianjia Zhang virtio_dev_init(virtio_vsock_init);
330117d6495STianjia Zhang 
331117d6495STianjia Zhang int virtio_vsock_exit(struct kvm *kvm)
332117d6495STianjia Zhang {
333117d6495STianjia Zhang 	while (!list_empty(&vdevs)) {
334117d6495STianjia Zhang 		struct vsock_dev *vdev;
335117d6495STianjia Zhang 
336117d6495STianjia Zhang 		vdev = list_first_entry(&vdevs, struct vsock_dev, list);
337117d6495STianjia Zhang 		virtio_vsock_exit_one(kvm, vdev);
338117d6495STianjia Zhang 	}
339117d6495STianjia Zhang 
340117d6495STianjia Zhang 	return 0;
341117d6495STianjia Zhang }
342117d6495STianjia Zhang virtio_dev_exit(virtio_vsock_exit);
343