/* xref: /kvmtool/virtio/vsock.c (revision 867b15ccd7dae9ba7a174f97d4fe76e90a79d957) */
#include "kvm/virtio-vsock.h"
#include "kvm/virtio-pci-dev.h"
#include "kvm/kvm.h"
#include "kvm/pci.h"
#include "kvm/ioeventfd.h"
#include "kvm/guest_compat.h"
#include "kvm/virtio-pci.h"
#include "kvm/virtio.h"

#include <linux/byteorder.h>
#include <linux/kernel.h>
#include <linux/virtio_vsock.h>
#include <linux/vhost.h>

#include <unistd.h>
14117d6495STianjia Zhang 
/* Ring size used when initialising and reporting every virtqueue */
#define VIRTIO_VSOCK_QUEUE_SIZE		128

/* All vsock devices created by virtio_vsock_init_one() */
static LIST_HEAD(vdevs);
/* Id from virtio_compat_add_message(); -1 until a message is registered */
static int compat_id = -1;
19117d6495STianjia Zhang 
/* Virtqueue indices of the vsock device */
enum {
	VSOCK_VQ_RX,		/* for host to guest data */
	VSOCK_VQ_TX,		/* for guest to host data */
	VSOCK_VQ_EVENT,
	VSOCK_VQ_MAX,		/* number of virtqueues */
};
26117d6495STianjia Zhang 
27117d6495STianjia Zhang struct vsock_dev {
28117d6495STianjia Zhang 	struct virt_queue		vqs[VSOCK_VQ_MAX];
29117d6495STianjia Zhang 	struct virtio_vsock_config	config;
30*867b15ccSJean-Philippe Brucker 	u64				guest_cid;
31117d6495STianjia Zhang 	u32				features;
32117d6495STianjia Zhang 	int				vhost_fd;
33117d6495STianjia Zhang 	struct virtio_device		vdev;
34117d6495STianjia Zhang 	struct list_head		list;
35117d6495STianjia Zhang 	struct kvm			*kvm;
36117d6495STianjia Zhang };
37117d6495STianjia Zhang 
38117d6495STianjia Zhang static u8 *get_config(struct kvm *kvm, void *dev)
39117d6495STianjia Zhang {
40117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
41117d6495STianjia Zhang 
42117d6495STianjia Zhang 	return ((u8 *)(&vdev->config));
43117d6495STianjia Zhang }
44117d6495STianjia Zhang 
45e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev)
46e4730284SMartin Radev {
47e4730284SMartin Radev 	struct vsock_dev *vdev = dev;
48e4730284SMartin Radev 
49e4730284SMartin Radev 	return sizeof(vdev->config);
50e4730284SMartin Radev }
51e4730284SMartin Radev 
52117d6495STianjia Zhang static u32 get_host_features(struct kvm *kvm, void *dev)
53117d6495STianjia Zhang {
54117d6495STianjia Zhang 	return 1UL << VIRTIO_RING_F_EVENT_IDX
55117d6495STianjia Zhang 		| 1UL << VIRTIO_RING_F_INDIRECT_DESC;
56117d6495STianjia Zhang }
57117d6495STianjia Zhang 
58117d6495STianjia Zhang static void set_guest_features(struct kvm *kvm, void *dev, u32 features)
59117d6495STianjia Zhang {
60117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
61117d6495STianjia Zhang 
62117d6495STianjia Zhang 	vdev->features = features;
63117d6495STianjia Zhang }
64117d6495STianjia Zhang 
65117d6495STianjia Zhang static bool is_event_vq(u32 vq)
66117d6495STianjia Zhang {
67117d6495STianjia Zhang 	return vq == VSOCK_VQ_EVENT;
68117d6495STianjia Zhang }
69117d6495STianjia Zhang 
70609ee906SJean-Philippe Brucker static int init_vq(struct kvm *kvm, void *dev, u32 vq)
71117d6495STianjia Zhang {
72117d6495STianjia Zhang 	struct vhost_vring_state state = { .index = vq };
73117d6495STianjia Zhang 	struct vhost_vring_addr addr;
74117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
75117d6495STianjia Zhang 	struct virt_queue *queue;
76117d6495STianjia Zhang 	int r;
77117d6495STianjia Zhang 
78117d6495STianjia Zhang 	compat__remove_message(compat_id);
79117d6495STianjia Zhang 
80117d6495STianjia Zhang 	queue		= &vdev->vqs[vq];
81609ee906SJean-Philippe Brucker 	virtio_init_device_vq(kvm, &vdev->vdev, queue, VIRTIO_VSOCK_QUEUE_SIZE);
82117d6495STianjia Zhang 
83117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
84117d6495STianjia Zhang 		return 0;
85117d6495STianjia Zhang 
86117d6495STianjia Zhang 	if (is_event_vq(vq))
87117d6495STianjia Zhang 		return 0;
88117d6495STianjia Zhang 
89117d6495STianjia Zhang 	state.num = queue->vring.num;
90117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_NUM, &state);
91117d6495STianjia Zhang 	if (r < 0)
92117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_NUM failed");
93117d6495STianjia Zhang 
94117d6495STianjia Zhang 	state.num = 0;
95117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_BASE, &state);
96117d6495STianjia Zhang 	if (r < 0)
97117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_BASE failed");
98117d6495STianjia Zhang 
99117d6495STianjia Zhang 	addr = (struct vhost_vring_addr) {
100117d6495STianjia Zhang 		.index = vq,
101117d6495STianjia Zhang 		.desc_user_addr = (u64)(unsigned long)queue->vring.desc,
102117d6495STianjia Zhang 		.avail_user_addr = (u64)(unsigned long)queue->vring.avail,
103117d6495STianjia Zhang 		.used_user_addr = (u64)(unsigned long)queue->vring.used,
104117d6495STianjia Zhang 	};
105117d6495STianjia Zhang 
106117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_ADDR, &addr);
107117d6495STianjia Zhang 	if (r < 0)
108117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_ADDR failed");
109117d6495STianjia Zhang 
110117d6495STianjia Zhang 	return 0;
111117d6495STianjia Zhang }
112117d6495STianjia Zhang 
113117d6495STianjia Zhang static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd)
114117d6495STianjia Zhang {
115117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
116117d6495STianjia Zhang 	struct vhost_vring_file file = {
117117d6495STianjia Zhang 		.index	= vq,
118117d6495STianjia Zhang 		.fd	= efd,
119117d6495STianjia Zhang 	};
120117d6495STianjia Zhang 	int r;
121117d6495STianjia Zhang 
122117d6495STianjia Zhang 	if (is_event_vq(vq))
123117d6495STianjia Zhang 		return;
124117d6495STianjia Zhang 
125117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
126117d6495STianjia Zhang 		return;
127117d6495STianjia Zhang 
128117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_KICK, &file);
129117d6495STianjia Zhang 	if (r < 0)
130117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_KICK failed");
131117d6495STianjia Zhang }
132117d6495STianjia Zhang 
133117d6495STianjia Zhang static void notify_status(struct kvm *kvm, void *dev, u32 status)
134117d6495STianjia Zhang {
135117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
136117d6495STianjia Zhang 	int r, start;
137117d6495STianjia Zhang 
138*867b15ccSJean-Philippe Brucker 	if (status & VIRTIO__STATUS_CONFIG)
139*867b15ccSJean-Philippe Brucker 		vdev->config.guest_cid = cpu_to_le64(vdev->guest_cid);
140*867b15ccSJean-Philippe Brucker 
141a8e397bbSJean-Philippe Brucker 	if (status & VIRTIO__STATUS_START)
142a8e397bbSJean-Philippe Brucker 		start = 1;
143a8e397bbSJean-Philippe Brucker 	else if (status & VIRTIO__STATUS_STOP)
144a8e397bbSJean-Philippe Brucker 		start = 0;
145a8e397bbSJean-Philippe Brucker 	else
146117d6495STianjia Zhang 		return;
147117d6495STianjia Zhang 
148117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_RUNNING, &start);
149117d6495STianjia Zhang 	if (r != 0)
150117d6495STianjia Zhang 		die("VHOST_VSOCK_SET_RUNNING failed %d", errno);
151117d6495STianjia Zhang }
152117d6495STianjia Zhang 
153117d6495STianjia Zhang static int notify_vq(struct kvm *kvm, void *dev, u32 vq)
154117d6495STianjia Zhang {
155117d6495STianjia Zhang 	return 0;
156117d6495STianjia Zhang }
157117d6495STianjia Zhang 
158117d6495STianjia Zhang static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq)
159117d6495STianjia Zhang {
160117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
161117d6495STianjia Zhang 
162117d6495STianjia Zhang 	return &vdev->vqs[vq];
163117d6495STianjia Zhang }
164117d6495STianjia Zhang 
165117d6495STianjia Zhang static int get_size_vq(struct kvm *kvm, void *dev, u32 vq)
166117d6495STianjia Zhang {
167117d6495STianjia Zhang 	return VIRTIO_VSOCK_QUEUE_SIZE;
168117d6495STianjia Zhang }
169117d6495STianjia Zhang 
170117d6495STianjia Zhang static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size)
171117d6495STianjia Zhang {
172117d6495STianjia Zhang 	return size;
173117d6495STianjia Zhang }
174117d6495STianjia Zhang 
175117d6495STianjia Zhang static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi)
176117d6495STianjia Zhang {
177117d6495STianjia Zhang 	struct vhost_vring_file file;
178117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
179117d6495STianjia Zhang 	struct kvm_irqfd irq;
180117d6495STianjia Zhang 	int r;
181117d6495STianjia Zhang 
182117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
183117d6495STianjia Zhang 		return;
184117d6495STianjia Zhang 
185117d6495STianjia Zhang 	if (is_event_vq(vq))
186117d6495STianjia Zhang 		return;
187117d6495STianjia Zhang 
188117d6495STianjia Zhang 	irq = (struct kvm_irqfd) {
189117d6495STianjia Zhang 		.gsi	= gsi,
190117d6495STianjia Zhang 		.fd	= eventfd(0, 0),
191117d6495STianjia Zhang 	};
192117d6495STianjia Zhang 	file = (struct vhost_vring_file) {
193117d6495STianjia Zhang 		.index	= vq,
194117d6495STianjia Zhang 		.fd	= irq.fd,
195117d6495STianjia Zhang 	};
196117d6495STianjia Zhang 
197117d6495STianjia Zhang 	r = ioctl(kvm->vm_fd, KVM_IRQFD, &irq);
198117d6495STianjia Zhang 	if (r < 0)
199117d6495STianjia Zhang 		die_perror("KVM_IRQFD failed");
200117d6495STianjia Zhang 
201117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_CALL, &file);
202117d6495STianjia Zhang 	if (r < 0)
203117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_CALL failed");
204117d6495STianjia Zhang }
205117d6495STianjia Zhang 
20631e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev)
207117d6495STianjia Zhang {
208117d6495STianjia Zhang 	return VSOCK_VQ_MAX;
209117d6495STianjia Zhang }
210117d6495STianjia Zhang 
211117d6495STianjia Zhang static struct virtio_ops vsock_dev_virtio_ops = {
212117d6495STianjia Zhang 	.get_config		= get_config,
213e4730284SMartin Radev 	.get_config_size	= get_config_size,
214117d6495STianjia Zhang 	.get_host_features	= get_host_features,
215117d6495STianjia Zhang 	.set_guest_features	= set_guest_features,
216117d6495STianjia Zhang 	.init_vq		= init_vq,
217117d6495STianjia Zhang 	.get_vq			= get_vq,
218117d6495STianjia Zhang 	.get_size_vq		= get_size_vq,
219117d6495STianjia Zhang 	.set_size_vq		= set_size_vq,
220117d6495STianjia Zhang 	.notify_vq_eventfd	= notify_vq_eventfd,
221117d6495STianjia Zhang 	.notify_status		= notify_status,
222117d6495STianjia Zhang 	.notify_vq_gsi		= notify_vq_gsi,
223117d6495STianjia Zhang 	.notify_vq		= notify_vq,
224117d6495STianjia Zhang 	.get_vq_count		= get_vq_count,
225117d6495STianjia Zhang };
226117d6495STianjia Zhang 
227117d6495STianjia Zhang static void virtio_vhost_vsock_init(struct kvm *kvm, struct vsock_dev *vdev)
228117d6495STianjia Zhang {
229117d6495STianjia Zhang 	struct kvm_mem_bank *bank;
230117d6495STianjia Zhang 	struct vhost_memory *mem;
231117d6495STianjia Zhang 	u64 features;
232117d6495STianjia Zhang 	int r, i;
233117d6495STianjia Zhang 
234117d6495STianjia Zhang 	vdev->vhost_fd = open("/dev/vhost-vsock", O_RDWR);
235117d6495STianjia Zhang 	if (vdev->vhost_fd < 0)
236117d6495STianjia Zhang 		die_perror("Failed opening vhost-vsock device");
237117d6495STianjia Zhang 
238117d6495STianjia Zhang 	mem = calloc(1, sizeof(*mem) + sizeof(struct vhost_memory_region));
239117d6495STianjia Zhang 	if (mem == NULL)
240117d6495STianjia Zhang 		die("Failed allocating memory for vhost memory map");
241117d6495STianjia Zhang 
242117d6495STianjia Zhang 	i = 0;
243117d6495STianjia Zhang 	list_for_each_entry(bank, &kvm->mem_banks, list) {
244117d6495STianjia Zhang 		mem->regions[i] = (struct vhost_memory_region) {
245117d6495STianjia Zhang 			.guest_phys_addr = bank->guest_phys_addr,
246117d6495STianjia Zhang 			.memory_size	 = bank->size,
247117d6495STianjia Zhang 			.userspace_addr	 = (unsigned long)bank->host_addr,
248117d6495STianjia Zhang 		};
249117d6495STianjia Zhang 		i++;
250117d6495STianjia Zhang 	}
251117d6495STianjia Zhang 	mem->nregions = i;
252117d6495STianjia Zhang 
253117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_OWNER);
254117d6495STianjia Zhang 	if (r != 0)
255117d6495STianjia Zhang 		die_perror("VHOST_SET_OWNER failed");
256117d6495STianjia Zhang 
257117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_MEM_TABLE, mem);
258117d6495STianjia Zhang 	if (r != 0)
259117d6495STianjia Zhang 		die_perror("VHOST_SET_MEM_TABLE failed");
260117d6495STianjia Zhang 
261117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_GET_FEATURES, &features);
262117d6495STianjia Zhang 	if (r != 0)
263117d6495STianjia Zhang 		die_perror("VHOST_GET_FEATURES failed");
264117d6495STianjia Zhang 
265117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_FEATURES, &features);
266117d6495STianjia Zhang 	if (r != 0)
267117d6495STianjia Zhang 		die_perror("VHOST_SET_FEATURES failed");
268117d6495STianjia Zhang 
269*867b15ccSJean-Philippe Brucker 	r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_GUEST_CID, &vdev->guest_cid);
270117d6495STianjia Zhang 	if (r != 0)
271117d6495STianjia Zhang 		die_perror("VHOST_VSOCK_SET_GUEST_CID failed");
272117d6495STianjia Zhang 
273117d6495STianjia Zhang 	vdev->vdev.use_vhost = true;
274117d6495STianjia Zhang 
275117d6495STianjia Zhang 	free(mem);
276117d6495STianjia Zhang }
277117d6495STianjia Zhang 
278117d6495STianjia Zhang static int virtio_vsock_init_one(struct kvm *kvm, u64 guest_cid)
279117d6495STianjia Zhang {
280117d6495STianjia Zhang 	struct vsock_dev *vdev;
281117d6495STianjia Zhang 	int r;
282117d6495STianjia Zhang 
283117d6495STianjia Zhang 	vdev = calloc(1, sizeof(struct vsock_dev));
284117d6495STianjia Zhang 	if (vdev == NULL)
285117d6495STianjia Zhang 		return -ENOMEM;
286117d6495STianjia Zhang 
287117d6495STianjia Zhang 	*vdev = (struct vsock_dev) {
288117d6495STianjia Zhang 		.guest_cid		= guest_cid,
289117d6495STianjia Zhang 		.vhost_fd		= -1,
290117d6495STianjia Zhang 		.kvm			= kvm,
291117d6495STianjia Zhang 	};
292117d6495STianjia Zhang 
293117d6495STianjia Zhang 	list_add_tail(&vdev->list, &vdevs);
294117d6495STianjia Zhang 
295117d6495STianjia Zhang 	r = virtio_init(kvm, vdev, &vdev->vdev, &vsock_dev_virtio_ops,
296117d6495STianjia Zhang 		    VIRTIO_DEFAULT_TRANS(kvm), PCI_DEVICE_ID_VIRTIO_VSOCK,
297117d6495STianjia Zhang 		    VIRTIO_ID_VSOCK, PCI_CLASS_VSOCK);
298117d6495STianjia Zhang 	if (r < 0)
299117d6495STianjia Zhang 	    return r;
300117d6495STianjia Zhang 
301117d6495STianjia Zhang 	virtio_vhost_vsock_init(kvm, vdev);
302117d6495STianjia Zhang 
303117d6495STianjia Zhang 	if (compat_id == -1)
304117d6495STianjia Zhang 		compat_id = virtio_compat_add_message("virtio-vsock", "CONFIG_VIRTIO_VSOCK");
305117d6495STianjia Zhang 
306117d6495STianjia Zhang 	return 0;
307117d6495STianjia Zhang }
308117d6495STianjia Zhang 
309117d6495STianjia Zhang static int virtio_vsock_exit_one(struct kvm *kvm, struct vsock_dev *vdev)
310117d6495STianjia Zhang {
311117d6495STianjia Zhang 	list_del(&vdev->list);
312117d6495STianjia Zhang 	free(vdev);
313117d6495STianjia Zhang 
314117d6495STianjia Zhang 	return 0;
315117d6495STianjia Zhang }
316117d6495STianjia Zhang 
317117d6495STianjia Zhang int virtio_vsock_init(struct kvm *kvm)
318117d6495STianjia Zhang {
319117d6495STianjia Zhang 	int r;
320117d6495STianjia Zhang 
321117d6495STianjia Zhang 	if (kvm->cfg.vsock_cid == 0)
322117d6495STianjia Zhang 		return 0;
323117d6495STianjia Zhang 
324117d6495STianjia Zhang 	r = virtio_vsock_init_one(kvm, kvm->cfg.vsock_cid);
325117d6495STianjia Zhang 	if (r < 0)
326117d6495STianjia Zhang 		goto cleanup;
327117d6495STianjia Zhang 
328117d6495STianjia Zhang 	return 0;
329117d6495STianjia Zhang cleanup:
330117d6495STianjia Zhang 	return virtio_vsock_exit(kvm);
331117d6495STianjia Zhang }
332117d6495STianjia Zhang virtio_dev_init(virtio_vsock_init);
333117d6495STianjia Zhang 
334117d6495STianjia Zhang int virtio_vsock_exit(struct kvm *kvm)
335117d6495STianjia Zhang {
336117d6495STianjia Zhang 	while (!list_empty(&vdevs)) {
337117d6495STianjia Zhang 		struct vsock_dev *vdev;
338117d6495STianjia Zhang 
339117d6495STianjia Zhang 		vdev = list_first_entry(&vdevs, struct vsock_dev, list);
340117d6495STianjia Zhang 		virtio_vsock_exit_one(kvm, vdev);
341117d6495STianjia Zhang 	}
342117d6495STianjia Zhang 
343117d6495STianjia Zhang 	return 0;
344117d6495STianjia Zhang }
345117d6495STianjia Zhang virtio_dev_exit(virtio_vsock_exit);
346