xref: /kvmtool/virtio/vsock.c (revision 9b46ebc561d3cc3bb54a350e4eed94d24562f347)
#include "kvm/virtio-vsock.h"
#include "kvm/virtio-pci-dev.h"
#include "kvm/kvm.h"
#include "kvm/pci.h"
#include "kvm/ioeventfd.h"
#include "kvm/guest_compat.h"
#include "kvm/virtio-pci.h"
#include "kvm/virtio.h"

#include <linux/byteorder.h>
#include <linux/kernel.h>
#include <linux/virtio_vsock.h>
#include <linux/vhost.h>

#include <unistd.h>
14117d6495STianjia Zhang 
/* Ring size used for every virtqueue of the vsock device. */
#define VIRTIO_VSOCK_QUEUE_SIZE		128

/* All vsock devices created by this file, linked through vsock_dev::list. */
static LIST_HEAD(vdevs);

/* Handle from virtio_compat_add_message(); -1 while none is registered. */
static int compat_id = -1;
19117d6495STianjia Zhang 
/* Virtqueue indices of the vsock device. */
enum {
	/* host -> guest data */
	VSOCK_VQ_RX     = 0,
	/* guest -> host data */
	VSOCK_VQ_TX     = 1,
	/* event queue; the callbacks in this file never hand it to vhost */
	VSOCK_VQ_EVENT  = 2,
	/* number of queues, used to size vsock_dev::vqs */
	VSOCK_VQ_MAX    = 3,
};
26117d6495STianjia Zhang 
27117d6495STianjia Zhang struct vsock_dev {
28117d6495STianjia Zhang 	struct virt_queue		vqs[VSOCK_VQ_MAX];
29117d6495STianjia Zhang 	struct virtio_vsock_config	config;
30867b15ccSJean-Philippe Brucker 	u64				guest_cid;
31117d6495STianjia Zhang 	u32				features;
32117d6495STianjia Zhang 	int				vhost_fd;
33117d6495STianjia Zhang 	struct virtio_device		vdev;
34117d6495STianjia Zhang 	struct list_head		list;
35117d6495STianjia Zhang 	struct kvm			*kvm;
36117d6495STianjia Zhang };
37117d6495STianjia Zhang 
38117d6495STianjia Zhang static u8 *get_config(struct kvm *kvm, void *dev)
39117d6495STianjia Zhang {
40117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
41117d6495STianjia Zhang 
42117d6495STianjia Zhang 	return ((u8 *)(&vdev->config));
43117d6495STianjia Zhang }
44117d6495STianjia Zhang 
45e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev)
46e4730284SMartin Radev {
47e4730284SMartin Radev 	struct vsock_dev *vdev = dev;
48e4730284SMartin Radev 
49e4730284SMartin Radev 	return sizeof(vdev->config);
50e4730284SMartin Radev }
51e4730284SMartin Radev 
523c8f82b8SJean-Philippe Brucker static u64 get_host_features(struct kvm *kvm, void *dev)
53117d6495STianjia Zhang {
54117d6495STianjia Zhang 	return 1UL << VIRTIO_RING_F_EVENT_IDX
55117d6495STianjia Zhang 		| 1UL << VIRTIO_RING_F_INDIRECT_DESC;
56117d6495STianjia Zhang }
57117d6495STianjia Zhang 
58117d6495STianjia Zhang static bool is_event_vq(u32 vq)
59117d6495STianjia Zhang {
60117d6495STianjia Zhang 	return vq == VSOCK_VQ_EVENT;
61117d6495STianjia Zhang }
62117d6495STianjia Zhang 
63609ee906SJean-Philippe Brucker static int init_vq(struct kvm *kvm, void *dev, u32 vq)
64117d6495STianjia Zhang {
65117d6495STianjia Zhang 	struct vhost_vring_state state = { .index = vq };
66117d6495STianjia Zhang 	struct vhost_vring_addr addr;
67117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
68117d6495STianjia Zhang 	struct virt_queue *queue;
69117d6495STianjia Zhang 	int r;
70117d6495STianjia Zhang 
71117d6495STianjia Zhang 	compat__remove_message(compat_id);
72117d6495STianjia Zhang 
73117d6495STianjia Zhang 	queue		= &vdev->vqs[vq];
74609ee906SJean-Philippe Brucker 	virtio_init_device_vq(kvm, &vdev->vdev, queue, VIRTIO_VSOCK_QUEUE_SIZE);
75117d6495STianjia Zhang 
76117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
77117d6495STianjia Zhang 		return 0;
78117d6495STianjia Zhang 
79117d6495STianjia Zhang 	if (is_event_vq(vq))
80117d6495STianjia Zhang 		return 0;
81117d6495STianjia Zhang 
82117d6495STianjia Zhang 	state.num = queue->vring.num;
83117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_NUM, &state);
84117d6495STianjia Zhang 	if (r < 0)
85117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_NUM failed");
86117d6495STianjia Zhang 
87117d6495STianjia Zhang 	state.num = 0;
88117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_BASE, &state);
89117d6495STianjia Zhang 	if (r < 0)
90117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_BASE failed");
91117d6495STianjia Zhang 
92117d6495STianjia Zhang 	addr = (struct vhost_vring_addr) {
93117d6495STianjia Zhang 		.index = vq,
94117d6495STianjia Zhang 		.desc_user_addr = (u64)(unsigned long)queue->vring.desc,
95117d6495STianjia Zhang 		.avail_user_addr = (u64)(unsigned long)queue->vring.avail,
96117d6495STianjia Zhang 		.used_user_addr = (u64)(unsigned long)queue->vring.used,
97117d6495STianjia Zhang 	};
98117d6495STianjia Zhang 
99117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_ADDR, &addr);
100117d6495STianjia Zhang 	if (r < 0)
101117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_ADDR failed");
102117d6495STianjia Zhang 
103117d6495STianjia Zhang 	return 0;
104117d6495STianjia Zhang }
105117d6495STianjia Zhang 
106117d6495STianjia Zhang static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd)
107117d6495STianjia Zhang {
108117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
109117d6495STianjia Zhang 	struct vhost_vring_file file = {
110117d6495STianjia Zhang 		.index	= vq,
111117d6495STianjia Zhang 		.fd	= efd,
112117d6495STianjia Zhang 	};
113117d6495STianjia Zhang 	int r;
114117d6495STianjia Zhang 
115117d6495STianjia Zhang 	if (is_event_vq(vq))
116117d6495STianjia Zhang 		return;
117117d6495STianjia Zhang 
118117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
119117d6495STianjia Zhang 		return;
120117d6495STianjia Zhang 
121117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_KICK, &file);
122117d6495STianjia Zhang 	if (r < 0)
123117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_KICK failed");
124117d6495STianjia Zhang }
125117d6495STianjia Zhang 
126117d6495STianjia Zhang static void notify_status(struct kvm *kvm, void *dev, u32 status)
127117d6495STianjia Zhang {
128117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
129117d6495STianjia Zhang 	int r, start;
130117d6495STianjia Zhang 
131867b15ccSJean-Philippe Brucker 	if (status & VIRTIO__STATUS_CONFIG)
132867b15ccSJean-Philippe Brucker 		vdev->config.guest_cid = cpu_to_le64(vdev->guest_cid);
133867b15ccSJean-Philippe Brucker 
134a8e397bbSJean-Philippe Brucker 	if (status & VIRTIO__STATUS_START)
135a8e397bbSJean-Philippe Brucker 		start = 1;
136a8e397bbSJean-Philippe Brucker 	else if (status & VIRTIO__STATUS_STOP)
137a8e397bbSJean-Philippe Brucker 		start = 0;
138a8e397bbSJean-Philippe Brucker 	else
139117d6495STianjia Zhang 		return;
140117d6495STianjia Zhang 
141117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_RUNNING, &start);
142117d6495STianjia Zhang 	if (r != 0)
143117d6495STianjia Zhang 		die("VHOST_VSOCK_SET_RUNNING failed %d", errno);
144117d6495STianjia Zhang }
145117d6495STianjia Zhang 
146117d6495STianjia Zhang static int notify_vq(struct kvm *kvm, void *dev, u32 vq)
147117d6495STianjia Zhang {
148117d6495STianjia Zhang 	return 0;
149117d6495STianjia Zhang }
150117d6495STianjia Zhang 
151117d6495STianjia Zhang static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq)
152117d6495STianjia Zhang {
153117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
154117d6495STianjia Zhang 
155117d6495STianjia Zhang 	return &vdev->vqs[vq];
156117d6495STianjia Zhang }
157117d6495STianjia Zhang 
158117d6495STianjia Zhang static int get_size_vq(struct kvm *kvm, void *dev, u32 vq)
159117d6495STianjia Zhang {
160117d6495STianjia Zhang 	return VIRTIO_VSOCK_QUEUE_SIZE;
161117d6495STianjia Zhang }
162117d6495STianjia Zhang 
163117d6495STianjia Zhang static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size)
164117d6495STianjia Zhang {
165117d6495STianjia Zhang 	return size;
166117d6495STianjia Zhang }
167117d6495STianjia Zhang 
168117d6495STianjia Zhang static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi)
169117d6495STianjia Zhang {
170117d6495STianjia Zhang 	struct vhost_vring_file file;
171117d6495STianjia Zhang 	struct vsock_dev *vdev = dev;
172117d6495STianjia Zhang 	struct kvm_irqfd irq;
173117d6495STianjia Zhang 	int r;
174117d6495STianjia Zhang 
175117d6495STianjia Zhang 	if (vdev->vhost_fd == -1)
176117d6495STianjia Zhang 		return;
177117d6495STianjia Zhang 
178117d6495STianjia Zhang 	if (is_event_vq(vq))
179117d6495STianjia Zhang 		return;
180117d6495STianjia Zhang 
181117d6495STianjia Zhang 	irq = (struct kvm_irqfd) {
182117d6495STianjia Zhang 		.gsi	= gsi,
183117d6495STianjia Zhang 		.fd	= eventfd(0, 0),
184117d6495STianjia Zhang 	};
185117d6495STianjia Zhang 	file = (struct vhost_vring_file) {
186117d6495STianjia Zhang 		.index	= vq,
187117d6495STianjia Zhang 		.fd	= irq.fd,
188117d6495STianjia Zhang 	};
189117d6495STianjia Zhang 
190117d6495STianjia Zhang 	r = ioctl(kvm->vm_fd, KVM_IRQFD, &irq);
191117d6495STianjia Zhang 	if (r < 0)
192117d6495STianjia Zhang 		die_perror("KVM_IRQFD failed");
193117d6495STianjia Zhang 
194117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_VRING_CALL, &file);
195117d6495STianjia Zhang 	if (r < 0)
196117d6495STianjia Zhang 		die_perror("VHOST_SET_VRING_CALL failed");
197117d6495STianjia Zhang }
198117d6495STianjia Zhang 
19931e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev)
200117d6495STianjia Zhang {
201117d6495STianjia Zhang 	return VSOCK_VQ_MAX;
202117d6495STianjia Zhang }
203117d6495STianjia Zhang 
204117d6495STianjia Zhang static struct virtio_ops vsock_dev_virtio_ops = {
205117d6495STianjia Zhang 	.get_config		= get_config,
206e4730284SMartin Radev 	.get_config_size	= get_config_size,
207117d6495STianjia Zhang 	.get_host_features	= get_host_features,
208117d6495STianjia Zhang 	.init_vq		= init_vq,
209117d6495STianjia Zhang 	.get_vq			= get_vq,
210117d6495STianjia Zhang 	.get_size_vq		= get_size_vq,
211117d6495STianjia Zhang 	.set_size_vq		= set_size_vq,
212117d6495STianjia Zhang 	.notify_vq_eventfd	= notify_vq_eventfd,
213117d6495STianjia Zhang 	.notify_status		= notify_status,
214117d6495STianjia Zhang 	.notify_vq_gsi		= notify_vq_gsi,
215117d6495STianjia Zhang 	.notify_vq		= notify_vq,
216117d6495STianjia Zhang 	.get_vq_count		= get_vq_count,
217117d6495STianjia Zhang };
218117d6495STianjia Zhang 
219117d6495STianjia Zhang static void virtio_vhost_vsock_init(struct kvm *kvm, struct vsock_dev *vdev)
220117d6495STianjia Zhang {
221117d6495STianjia Zhang 	struct kvm_mem_bank *bank;
222117d6495STianjia Zhang 	struct vhost_memory *mem;
223117d6495STianjia Zhang 	u64 features;
224117d6495STianjia Zhang 	int r, i;
225117d6495STianjia Zhang 
226117d6495STianjia Zhang 	vdev->vhost_fd = open("/dev/vhost-vsock", O_RDWR);
227117d6495STianjia Zhang 	if (vdev->vhost_fd < 0)
228117d6495STianjia Zhang 		die_perror("Failed opening vhost-vsock device");
229117d6495STianjia Zhang 
230117d6495STianjia Zhang 	mem = calloc(1, sizeof(*mem) + sizeof(struct vhost_memory_region));
231117d6495STianjia Zhang 	if (mem == NULL)
232117d6495STianjia Zhang 		die("Failed allocating memory for vhost memory map");
233117d6495STianjia Zhang 
234117d6495STianjia Zhang 	i = 0;
235117d6495STianjia Zhang 	list_for_each_entry(bank, &kvm->mem_banks, list) {
236117d6495STianjia Zhang 		mem->regions[i] = (struct vhost_memory_region) {
237117d6495STianjia Zhang 			.guest_phys_addr = bank->guest_phys_addr,
238117d6495STianjia Zhang 			.memory_size	 = bank->size,
239117d6495STianjia Zhang 			.userspace_addr	 = (unsigned long)bank->host_addr,
240117d6495STianjia Zhang 		};
241117d6495STianjia Zhang 		i++;
242117d6495STianjia Zhang 	}
243117d6495STianjia Zhang 	mem->nregions = i;
244117d6495STianjia Zhang 
245117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_OWNER);
246117d6495STianjia Zhang 	if (r != 0)
247117d6495STianjia Zhang 		die_perror("VHOST_SET_OWNER failed");
248117d6495STianjia Zhang 
249117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_MEM_TABLE, mem);
250117d6495STianjia Zhang 	if (r != 0)
251117d6495STianjia Zhang 		die_perror("VHOST_SET_MEM_TABLE failed");
252117d6495STianjia Zhang 
253117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_GET_FEATURES, &features);
254117d6495STianjia Zhang 	if (r != 0)
255117d6495STianjia Zhang 		die_perror("VHOST_GET_FEATURES failed");
256117d6495STianjia Zhang 
257117d6495STianjia Zhang 	r = ioctl(vdev->vhost_fd, VHOST_SET_FEATURES, &features);
258117d6495STianjia Zhang 	if (r != 0)
259117d6495STianjia Zhang 		die_perror("VHOST_SET_FEATURES failed");
260117d6495STianjia Zhang 
261867b15ccSJean-Philippe Brucker 	r = ioctl(vdev->vhost_fd, VHOST_VSOCK_SET_GUEST_CID, &vdev->guest_cid);
262117d6495STianjia Zhang 	if (r != 0)
263117d6495STianjia Zhang 		die_perror("VHOST_VSOCK_SET_GUEST_CID failed");
264117d6495STianjia Zhang 
265117d6495STianjia Zhang 	vdev->vdev.use_vhost = true;
266117d6495STianjia Zhang 
267117d6495STianjia Zhang 	free(mem);
268117d6495STianjia Zhang }
269117d6495STianjia Zhang 
270117d6495STianjia Zhang static int virtio_vsock_init_one(struct kvm *kvm, u64 guest_cid)
271117d6495STianjia Zhang {
272117d6495STianjia Zhang 	struct vsock_dev *vdev;
273117d6495STianjia Zhang 	int r;
274117d6495STianjia Zhang 
275117d6495STianjia Zhang 	vdev = calloc(1, sizeof(struct vsock_dev));
276117d6495STianjia Zhang 	if (vdev == NULL)
277117d6495STianjia Zhang 		return -ENOMEM;
278117d6495STianjia Zhang 
279117d6495STianjia Zhang 	*vdev = (struct vsock_dev) {
280117d6495STianjia Zhang 		.guest_cid		= guest_cid,
281117d6495STianjia Zhang 		.vhost_fd		= -1,
282117d6495STianjia Zhang 		.kvm			= kvm,
283117d6495STianjia Zhang 	};
284117d6495STianjia Zhang 
285117d6495STianjia Zhang 	list_add_tail(&vdev->list, &vdevs);
286117d6495STianjia Zhang 
287117d6495STianjia Zhang 	r = virtio_init(kvm, vdev, &vdev->vdev, &vsock_dev_virtio_ops,
288*9b46ebc5SRajnesh Kanwal 		    kvm->cfg.virtio_transport, PCI_DEVICE_ID_VIRTIO_VSOCK,
289117d6495STianjia Zhang 		    VIRTIO_ID_VSOCK, PCI_CLASS_VSOCK);
290117d6495STianjia Zhang 	if (r < 0)
291117d6495STianjia Zhang 	    return r;
292117d6495STianjia Zhang 
293117d6495STianjia Zhang 	virtio_vhost_vsock_init(kvm, vdev);
294117d6495STianjia Zhang 
295117d6495STianjia Zhang 	if (compat_id == -1)
296117d6495STianjia Zhang 		compat_id = virtio_compat_add_message("virtio-vsock", "CONFIG_VIRTIO_VSOCK");
297117d6495STianjia Zhang 
298117d6495STianjia Zhang 	return 0;
299117d6495STianjia Zhang }
300117d6495STianjia Zhang 
301117d6495STianjia Zhang static int virtio_vsock_exit_one(struct kvm *kvm, struct vsock_dev *vdev)
302117d6495STianjia Zhang {
303117d6495STianjia Zhang 	list_del(&vdev->list);
304117d6495STianjia Zhang 	free(vdev);
305117d6495STianjia Zhang 
306117d6495STianjia Zhang 	return 0;
307117d6495STianjia Zhang }
308117d6495STianjia Zhang 
309117d6495STianjia Zhang int virtio_vsock_init(struct kvm *kvm)
310117d6495STianjia Zhang {
311117d6495STianjia Zhang 	int r;
312117d6495STianjia Zhang 
313117d6495STianjia Zhang 	if (kvm->cfg.vsock_cid == 0)
314117d6495STianjia Zhang 		return 0;
315117d6495STianjia Zhang 
316117d6495STianjia Zhang 	r = virtio_vsock_init_one(kvm, kvm->cfg.vsock_cid);
317117d6495STianjia Zhang 	if (r < 0)
318117d6495STianjia Zhang 		goto cleanup;
319117d6495STianjia Zhang 
320117d6495STianjia Zhang 	return 0;
321117d6495STianjia Zhang cleanup:
322117d6495STianjia Zhang 	return virtio_vsock_exit(kvm);
323117d6495STianjia Zhang }
324117d6495STianjia Zhang virtio_dev_init(virtio_vsock_init);
325117d6495STianjia Zhang 
326117d6495STianjia Zhang int virtio_vsock_exit(struct kvm *kvm)
327117d6495STianjia Zhang {
328117d6495STianjia Zhang 	while (!list_empty(&vdevs)) {
329117d6495STianjia Zhang 		struct vsock_dev *vdev;
330117d6495STianjia Zhang 
331117d6495STianjia Zhang 		vdev = list_first_entry(&vdevs, struct vsock_dev, list);
332117d6495STianjia Zhang 		virtio_vsock_exit_one(kvm, vdev);
333117d6495STianjia Zhang 	}
334117d6495STianjia Zhang 
335117d6495STianjia Zhang 	return 0;
336117d6495STianjia Zhang }
337117d6495STianjia Zhang virtio_dev_exit(virtio_vsock_exit);
338