xref: /kvmtool/virtio/net.c (revision eef27ae368562bcce4f8a2b65822b307da0d4146)
131638bcaSCyrill Gorcunov #include "kvm/virtio-pci-dev.h"
2b5ee1ea7SAsias He #include "kvm/virtio-net.h"
34f56d42cSAsias He #include "kvm/virtio.h"
44f56d42cSAsias He #include "kvm/mutex.h"
54f56d42cSAsias He #include "kvm/util.h"
64f56d42cSAsias He #include "kvm/kvm.h"
72449f6e3SSasha Levin #include "kvm/irq.h"
8b5ee1ea7SAsias He #include "kvm/uip.h"
9cb83de6fSSasha Levin #include "kvm/guest_compat.h"
107668c3a6SSasha Levin #include "kvm/iovec.h"
114f56d42cSAsias He 
129ed67cdcSSasha Levin #include <linux/vhost.h>
134f56d42cSAsias He #include <linux/virtio_net.h>
144f56d42cSAsias He #include <linux/if_tun.h>
1578a2a3e2SSasha Levin #include <linux/types.h>
16c229370aSIngo Molnar 
17c229370aSIngo Molnar #include <arpa/inet.h>
184f56d42cSAsias He #include <net/if.h>
19c229370aSIngo Molnar 
20c229370aSIngo Molnar #include <unistd.h>
214f56d42cSAsias He #include <fcntl.h>
22c229370aSIngo Molnar 
23cb7202c1SSasha Levin #include <sys/socket.h>
24c229370aSIngo Molnar #include <sys/ioctl.h>
25c229370aSIngo Molnar #include <sys/types.h>
2673b7d038SAmos Kong #include <sys/wait.h>
279ed67cdcSSasha Levin #include <sys/eventfd.h>
284f56d42cSAsias He 
/* Number of descriptors in every virtqueue ring of this device. */
#define VIRTIO_NET_QUEUE_SIZE		256
/* Upper bound on rx/tx queue pairs; sizes the per-queue arrays of struct net_dev. */
#define VIRTIO_NET_NUM_QUEUES		8
314f56d42cSAsias He 
32b4fdde6dSAsias He struct net_dev;
33b4fdde6dSAsias He 
34b4fdde6dSAsias He struct net_dev_operations {
35b4fdde6dSAsias He 	int (*rx)(struct iovec *iov, u16 in, struct net_dev *ndev);
36b4fdde6dSAsias He 	int (*tx)(struct iovec *iov, u16 in, struct net_dev *ndev);
37b4fdde6dSAsias He };
38b4fdde6dSAsias He 
398626798bSAsias He struct net_dev {
40d3476f7dSSasha Levin 	struct mutex			mutex;
4102eca50cSAsias He 	struct virtio_device		vdev;
429a6d73f1SSasha Levin 	struct list_head		list;
434f56d42cSAsias He 
446585ffb7SSasha Levin 	struct virt_queue		vqs[VIRTIO_NET_NUM_QUEUES * 2 + 1];
45c229370aSIngo Molnar 	struct virtio_net_config	config;
4679052597SSasha Levin 	u32				features, rx_vqs, tx_vqs, queue_pairs;
474f56d42cSAsias He 
486585ffb7SSasha Levin 	pthread_t			io_thread[VIRTIO_NET_NUM_QUEUES * 2 + 1];
496585ffb7SSasha Levin 	struct mutex			io_lock[VIRTIO_NET_NUM_QUEUES * 2 + 1];
506585ffb7SSasha Levin 	pthread_cond_t			io_cond[VIRTIO_NET_NUM_QUEUES * 2 + 1];
51c4aa7c02SPekka Enberg 
529ed67cdcSSasha Levin 	int				vhost_fd;
534f56d42cSAsias He 	int				tap_fd;
544f56d42cSAsias He 	char				tap_name[IFNAMSIZ];
55bb1a32f1SAsias He 
56bb1a32f1SAsias He 	int				mode;
57bb1a32f1SAsias He 
58b5ee1ea7SAsias He 	struct uip_info			info;
59b4fdde6dSAsias He 	struct net_dev_operations	*ops;
609a6d73f1SSasha Levin 	struct kvm			*kvm;
618c0ae74dSSasha Levin 
628c0ae74dSSasha Levin 	struct virtio_net_params	*params;
634f56d42cSAsias He };
644f56d42cSAsias He 
/* List head for net devices (entries are presumably linked via net_dev.list). */
static LIST_HEAD(ndevs);
/* Id handed to compat__remove_message() as soon as a queue gets initialised. */
static int compat_id = -1;

/* Payload capacity of the rx bounce buffer; the virtio-net header is added on top. */
#define MAX_PACKET_SIZE 65550
697668c3a6SSasha Levin 
707668c3a6SSasha Levin static bool has_virtio_feature(struct net_dev *ndev, u32 feature)
717668c3a6SSasha Levin {
727668c3a6SSasha Levin 	return ndev->features & (1 << feature);
737668c3a6SSasha Levin }
747668c3a6SSasha Levin 
758ed60bbeSMarc Zyngier static void virtio_net_fix_tx_hdr(struct virtio_net_hdr *hdr, struct net_dev *ndev)
768ed60bbeSMarc Zyngier {
778ed60bbeSMarc Zyngier 	hdr->hdr_len		= virtio_guest_to_host_u16(&ndev->vdev, hdr->hdr_len);
788ed60bbeSMarc Zyngier 	hdr->gso_size		= virtio_guest_to_host_u16(&ndev->vdev, hdr->gso_size);
798ed60bbeSMarc Zyngier 	hdr->csum_start		= virtio_guest_to_host_u16(&ndev->vdev, hdr->csum_start);
808ed60bbeSMarc Zyngier 	hdr->csum_offset	= virtio_guest_to_host_u16(&ndev->vdev, hdr->csum_offset);
818ed60bbeSMarc Zyngier }
828ed60bbeSMarc Zyngier 
838ed60bbeSMarc Zyngier static void virtio_net_fix_rx_hdr(struct virtio_net_hdr_mrg_rxbuf *hdr, struct net_dev *ndev)
848ed60bbeSMarc Zyngier {
858ed60bbeSMarc Zyngier 	hdr->hdr.hdr_len	= virtio_host_to_guest_u16(&ndev->vdev, hdr->hdr.hdr_len);
868ed60bbeSMarc Zyngier 	hdr->hdr.gso_size	= virtio_host_to_guest_u16(&ndev->vdev, hdr->hdr.gso_size);
878ed60bbeSMarc Zyngier 	hdr->hdr.csum_start	= virtio_host_to_guest_u16(&ndev->vdev, hdr->hdr.csum_start);
888ed60bbeSMarc Zyngier 	hdr->hdr.csum_offset	= virtio_host_to_guest_u16(&ndev->vdev, hdr->hdr.csum_offset);
898ed60bbeSMarc Zyngier 	if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF))
908ed60bbeSMarc Zyngier 		hdr->num_buffers	= virtio_host_to_guest_u16(&ndev->vdev, hdr->num_buffers);
918ed60bbeSMarc Zyngier }
928ed60bbeSMarc Zyngier 
93c4aa7c02SPekka Enberg static void *virtio_net_rx_thread(void *p)
944f56d42cSAsias He {
954f56d42cSAsias He 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
964f56d42cSAsias He 	struct virt_queue *vq;
9743835ac9SSasha Levin 	struct kvm *kvm;
989a6d73f1SSasha Levin 	struct net_dev *ndev = p;
993fdf659dSSasha Levin 	u16 out, in;
1003fdf659dSSasha Levin 	u16 head;
1016d6cc14bSWill Deacon 	int len, copied;
1026585ffb7SSasha Levin 	u32 id;
1036585ffb7SSasha Levin 
1046585ffb7SSasha Levin 	mutex_lock(&ndev->mutex);
1056585ffb7SSasha Levin 	id = ndev->rx_vqs++ * 2;
1066585ffb7SSasha Levin 	mutex_unlock(&ndev->mutex);
1074f56d42cSAsias He 
108a4d8c55eSSasha Levin 	kvm__set_thread_name("virtio-net-rx");
109a4d8c55eSSasha Levin 
1109a6d73f1SSasha Levin 	kvm = ndev->kvm;
1116585ffb7SSasha Levin 	vq = &ndev->vqs[id];
112c4aa7c02SPekka Enberg 
113c4aa7c02SPekka Enberg 	while (1) {
1146585ffb7SSasha Levin 		mutex_lock(&ndev->io_lock[id]);
115c4aa7c02SPekka Enberg 		if (!virt_queue__available(vq))
1166585ffb7SSasha Levin 			pthread_cond_wait(&ndev->io_cond[id], &ndev->io_lock[id].mutex);
1176585ffb7SSasha Levin 		mutex_unlock(&ndev->io_lock[id]);
1184f56d42cSAsias He 
1194f56d42cSAsias He 		while (virt_queue__available(vq)) {
1207668c3a6SSasha Levin 			unsigned char buffer[MAX_PACKET_SIZE + sizeof(struct virtio_net_hdr_mrg_rxbuf)];
1217668c3a6SSasha Levin 			struct iovec dummy_iov = {
1227668c3a6SSasha Levin 				.iov_base = buffer,
1237668c3a6SSasha Levin 				.iov_len  = sizeof(buffer),
1247668c3a6SSasha Levin 			};
1257668c3a6SSasha Levin 			struct virtio_net_hdr_mrg_rxbuf *hdr;
1268ed60bbeSMarc Zyngier 			int i;
1277f5ffaf5SAsias He 
1287668c3a6SSasha Levin 			len = ndev->ops->rx(&dummy_iov, 1, ndev);
1296d6cc14bSWill Deacon 			if (len < 0) {
1306d6cc14bSWill Deacon 				pr_warning("%s: rx on vq %u failed (%d), exiting thread\n",
1316d6cc14bSWill Deacon 						__func__, id, len);
1326d6cc14bSWill Deacon 				goto out_err;
1336d6cc14bSWill Deacon 			}
1346d6cc14bSWill Deacon 
1358ed60bbeSMarc Zyngier 			copied = i = 0;
1367668c3a6SSasha Levin 			head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1378ed60bbeSMarc Zyngier 			hdr = iov[0].iov_base;
1387668c3a6SSasha Levin 			while (copied < len) {
1396d6cc14bSWill Deacon 				size_t iovsize = min_t(size_t, len - copied, iov_size(iov, in));
1407668c3a6SSasha Levin 
141e2493047SAsias He 				memcpy_toiovec(iov, buffer + copied, iovsize);
1427668c3a6SSasha Levin 				copied += iovsize;
1438ed60bbeSMarc Zyngier 				if (i++ == 0)
1448ed60bbeSMarc Zyngier 					virtio_net_fix_rx_hdr(hdr, ndev);
1458ed60bbeSMarc Zyngier 				if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF)) {
1468ed60bbeSMarc Zyngier 					u16 num_buffers = virtio_guest_to_host_u16(vq, hdr->num_buffers);
1478ed60bbeSMarc Zyngier 					hdr->num_buffers = virtio_host_to_guest_u16(vq, num_buffers + 1);
1488ed60bbeSMarc Zyngier 				}
1497668c3a6SSasha Levin 				virt_queue__set_used_elem(vq, head, iovsize);
1507668c3a6SSasha Levin 				if (copied == len)
1517668c3a6SSasha Levin 					break;
1527668c3a6SSasha Levin 				while (!virt_queue__available(vq))
1537668c3a6SSasha Levin 					sleep(0);
1547668c3a6SSasha Levin 				head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1557668c3a6SSasha Levin 			}
156c4aa7c02SPekka Enberg 			/* We should interrupt guest right now, otherwise latency is huge. */
1576585ffb7SSasha Levin 			if (virtio_queue__should_signal(vq))
1586585ffb7SSasha Levin 				ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, id);
1594f56d42cSAsias He 		}
160c4aa7c02SPekka Enberg 	}
161c4aa7c02SPekka Enberg 
1626d6cc14bSWill Deacon out_err:
163c4aa7c02SPekka Enberg 	pthread_exit(NULL);
164c4aa7c02SPekka Enberg 	return NULL;
165c4aa7c02SPekka Enberg 
166c4aa7c02SPekka Enberg }
167c4aa7c02SPekka Enberg 
168c4aa7c02SPekka Enberg static void *virtio_net_tx_thread(void *p)
1694f56d42cSAsias He {
1704f56d42cSAsias He 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
1714f56d42cSAsias He 	struct virt_queue *vq;
17243835ac9SSasha Levin 	struct kvm *kvm;
1739a6d73f1SSasha Levin 	struct net_dev *ndev = p;
1743fdf659dSSasha Levin 	u16 out, in;
1753fdf659dSSasha Levin 	u16 head;
1764f56d42cSAsias He 	int len;
1776585ffb7SSasha Levin 	u32 id;
1786585ffb7SSasha Levin 
1796585ffb7SSasha Levin 	mutex_lock(&ndev->mutex);
1806585ffb7SSasha Levin 	id = ndev->tx_vqs++ * 2 + 1;
1816585ffb7SSasha Levin 	mutex_unlock(&ndev->mutex);
1824f56d42cSAsias He 
183a4d8c55eSSasha Levin 	kvm__set_thread_name("virtio-net-tx");
184a4d8c55eSSasha Levin 
1859a6d73f1SSasha Levin 	kvm = ndev->kvm;
1866585ffb7SSasha Levin 	vq = &ndev->vqs[id];
187c4aa7c02SPekka Enberg 
188c4aa7c02SPekka Enberg 	while (1) {
1896585ffb7SSasha Levin 		mutex_lock(&ndev->io_lock[id]);
190c4aa7c02SPekka Enberg 		if (!virt_queue__available(vq))
1916585ffb7SSasha Levin 			pthread_cond_wait(&ndev->io_cond[id], &ndev->io_lock[id].mutex);
1926585ffb7SSasha Levin 		mutex_unlock(&ndev->io_lock[id]);
1934f56d42cSAsias He 
1944f56d42cSAsias He 		while (virt_queue__available(vq)) {
1958ed60bbeSMarc Zyngier 			struct virtio_net_hdr *hdr;
19643835ac9SSasha Levin 			head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1978ed60bbeSMarc Zyngier 			hdr = iov[0].iov_base;
1988ed60bbeSMarc Zyngier 			virtio_net_fix_tx_hdr(hdr, ndev);
1999a6d73f1SSasha Levin 			len = ndev->ops->tx(iov, out, ndev);
2006d6cc14bSWill Deacon 			if (len < 0) {
2016d6cc14bSWill Deacon 				pr_warning("%s: tx on vq %u failed (%d)\n",
2028ed60bbeSMarc Zyngier 						__func__, id, errno);
2036d6cc14bSWill Deacon 				goto out_err;
2046d6cc14bSWill Deacon 			}
2056d6cc14bSWill Deacon 
2064f56d42cSAsias He 			virt_queue__set_used_elem(vq, head, len);
2074f56d42cSAsias He 		}
2084f56d42cSAsias He 
2096585ffb7SSasha Levin 		if (virtio_queue__should_signal(vq))
2106585ffb7SSasha Levin 			ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, id);
2114f56d42cSAsias He 	}
2124f56d42cSAsias He 
2136d6cc14bSWill Deacon out_err:
214c4aa7c02SPekka Enberg 	pthread_exit(NULL);
215c4aa7c02SPekka Enberg 	return NULL;
216c4aa7c02SPekka Enberg }
217407475bfSPekka Enberg 
2186585ffb7SSasha Levin static virtio_net_ctrl_ack virtio_net_handle_mq(struct kvm* kvm, struct net_dev *ndev, struct virtio_net_ctrl_hdr *ctrl)
2196585ffb7SSasha Levin {
2206585ffb7SSasha Levin 	/* Not much to do here */
2216585ffb7SSasha Levin 	return VIRTIO_NET_OK;
2226585ffb7SSasha Levin }
2236585ffb7SSasha Levin 
2246585ffb7SSasha Levin static void *virtio_net_ctrl_thread(void *p)
225abd4a801SSasha Levin {
226abd4a801SSasha Levin 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
227abd4a801SSasha Levin 	u16 out, in, head;
2286585ffb7SSasha Levin 	struct net_dev *ndev = p;
2296585ffb7SSasha Levin 	struct kvm *kvm = ndev->kvm;
23079052597SSasha Levin 	u32 id = ndev->queue_pairs * 2;
2316585ffb7SSasha Levin 	struct virt_queue *vq = &ndev->vqs[id];
232abd4a801SSasha Levin 	struct virtio_net_ctrl_hdr *ctrl;
233abd4a801SSasha Levin 	virtio_net_ctrl_ack *ack;
234abd4a801SSasha Levin 
235edb4a8a0SSuzuki K. Poulose 	kvm__set_thread_name("virtio-net-ctrl");
236edb4a8a0SSuzuki K. Poulose 
2376585ffb7SSasha Levin 	while (1) {
2386585ffb7SSasha Levin 		mutex_lock(&ndev->io_lock[id]);
2396585ffb7SSasha Levin 		if (!virt_queue__available(vq))
2406585ffb7SSasha Levin 			pthread_cond_wait(&ndev->io_cond[id], &ndev->io_lock[id].mutex);
2416585ffb7SSasha Levin 		mutex_unlock(&ndev->io_lock[id]);
2426585ffb7SSasha Levin 
2436585ffb7SSasha Levin 		while (virt_queue__available(vq)) {
2446585ffb7SSasha Levin 			head = virt_queue__get_iov(&ndev->vqs[id], iov, &out, &in, kvm);
245abd4a801SSasha Levin 			ctrl = iov[0].iov_base;
246abd4a801SSasha Levin 			ack = iov[out].iov_base;
247abd4a801SSasha Levin 
248abd4a801SSasha Levin 			switch (ctrl->class) {
2496585ffb7SSasha Levin 			case VIRTIO_NET_CTRL_MQ:
2506585ffb7SSasha Levin 				*ack = virtio_net_handle_mq(kvm, ndev, ctrl);
2516585ffb7SSasha Levin 				break;
252abd4a801SSasha Levin 			default:
253abd4a801SSasha Levin 				*ack = VIRTIO_NET_ERR;
254abd4a801SSasha Levin 				break;
255abd4a801SSasha Levin 			}
2566585ffb7SSasha Levin 			virt_queue__set_used_elem(&ndev->vqs[id], head, iov[out].iov_len);
2576585ffb7SSasha Levin 		}
258abd4a801SSasha Levin 
2596585ffb7SSasha Levin 		if (virtio_queue__should_signal(&ndev->vqs[id]))
2606585ffb7SSasha Levin 			ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, id);
2616585ffb7SSasha Levin 	}
262abd4a801SSasha Levin 
2636585ffb7SSasha Levin 	pthread_exit(NULL);
264abd4a801SSasha Levin 
2656585ffb7SSasha Levin 	return NULL;
266abd4a801SSasha Levin }
267abd4a801SSasha Levin 
2689a6d73f1SSasha Levin static void virtio_net_handle_callback(struct kvm *kvm, struct net_dev *ndev, int queue)
2694f56d42cSAsias He {
27079052597SSasha Levin 	if ((u32)queue >= (ndev->queue_pairs * 2 + 1)) {
2719a6d73f1SSasha Levin 		pr_warning("Unknown queue index %u", queue);
2726585ffb7SSasha Levin 		return;
273c4aa7c02SPekka Enberg 	}
2746585ffb7SSasha Levin 
2756585ffb7SSasha Levin 	mutex_lock(&ndev->io_lock[queue]);
2766585ffb7SSasha Levin 	pthread_cond_signal(&ndev->io_cond[queue]);
2776585ffb7SSasha Levin 	mutex_unlock(&ndev->io_lock[queue]);
2784f56d42cSAsias He }
2794f56d42cSAsias He 
280d2a7ddffSMarc Zyngier static int virtio_net_request_tap(struct net_dev *ndev, struct ifreq *ifr,
281d2a7ddffSMarc Zyngier 				  const char *tapname)
282d2a7ddffSMarc Zyngier {
283d2a7ddffSMarc Zyngier 	int ret;
284d2a7ddffSMarc Zyngier 
285d2a7ddffSMarc Zyngier 	memset(ifr, 0, sizeof(*ifr));
286d2a7ddffSMarc Zyngier 	ifr->ifr_flags = IFF_TAP | IFF_NO_PI | IFF_VNET_HDR;
287d2a7ddffSMarc Zyngier 	if (tapname)
288d2a7ddffSMarc Zyngier 		strncpy(ifr->ifr_name, tapname, sizeof(ifr->ifr_name));
289d2a7ddffSMarc Zyngier 
290f83dc816SAndreas Herrmann 	ret = ioctl(ndev->tap_fd, TUNSETIFF, ifr);
291d2a7ddffSMarc Zyngier 
292d2a7ddffSMarc Zyngier 	if (ret >= 0)
293d2a7ddffSMarc Zyngier 		strncpy(ndev->tap_name, ifr->ifr_name, sizeof(ndev->tap_name));
294d2a7ddffSMarc Zyngier 	return ret;
295d2a7ddffSMarc Zyngier }
296d2a7ddffSMarc Zyngier 
/*
 * Run the tap setup script and wait for it to finish.
 *
 * @script:   path of the executable; also passed as argv[0]
 * @tap_name: name of the tap interface, passed as argv[1]
 *
 * Returns 0 when the script exited with status 0, -1 otherwise.  Failure
 * to fork, failure to wait for the child and a child that was terminated
 * by a signal all count as errors.
 */
static int virtio_net_exec_script(const char* script, const char *tap_name)
{
	pid_t pid;
	int status;

	pid = fork();
	if (pid < 0) {
		/* Never reach waitpid(-1, ...): it would reap an unrelated child. */
		pr_warning("Fail to setup tap by %s", script);
		return -1;
	}

	if (pid == 0) {
		execl(script, script, tap_name, (char *)NULL);
		/* Only reached when exec itself failed. */
		_exit(1);
	}

	/* Retry when the wait is interrupted by a signal. */
	while (waitpid(pid, &status, 0) < 0) {
		if (errno == EINTR)
			continue;
		pr_warning("Fail to setup tap by %s", script);
		return -1;
	}

	if (!WIFEXITED(status) || WEXITSTATUS(status) != 0) {
		pr_warning("Fail to setup tap by %s", script);
		return -1;
	}

	return 0;
}
315*eef27ae3SFan Du 
3168c0ae74dSSasha Levin static bool virtio_net__tap_init(struct net_dev *ndev)
3174f56d42cSAsias He {
318cb7202c1SSasha Levin 	int sock = socket(AF_INET, SOCK_STREAM, 0);
319*eef27ae3SFan Du 	int offload, hdr_len;
320cb7202c1SSasha Levin 	struct sockaddr_in sin = {0};
321246c8347SAsias He 	struct ifreq ifr;
3228c0ae74dSSasha Levin 	const struct virtio_net_params *params = ndev->params;
3231dfc7c24SMarc Zyngier 	bool skipconf = !!params->tapif;
324d2a7ddffSMarc Zyngier 	bool macvtap = skipconf && (params->tapif[0] == '/');
325d2a7ddffSMarc Zyngier 	const char *tap_file = "/dev/net/tun";
3264f56d42cSAsias He 
327f19edd1eSSasha Levin 	/* Did the user already gave us the FD? */
328f19edd1eSSasha Levin 	if (params->fd) {
329f19edd1eSSasha Levin 		ndev->tap_fd = params->fd;
330f19edd1eSSasha Levin 		return 1;
331f19edd1eSSasha Levin 	}
332f19edd1eSSasha Levin 
333d2a7ddffSMarc Zyngier 	if (macvtap)
334d2a7ddffSMarc Zyngier 		tap_file = params->tapif;
335d2a7ddffSMarc Zyngier 
336d2a7ddffSMarc Zyngier 	ndev->tap_fd = open(tap_file, O_RDWR);
3379a6d73f1SSasha Levin 	if (ndev->tap_fd < 0) {
338d2a7ddffSMarc Zyngier 		pr_warning("Unable to open %s", tap_file);
3393b02f580SSasha Levin 		goto fail;
3403b02f580SSasha Levin 	}
3414f56d42cSAsias He 
342d2a7ddffSMarc Zyngier 	if (!macvtap &&
343d2a7ddffSMarc Zyngier 	    virtio_net_request_tap(ndev, &ifr, params->tapif) < 0) {
3444542f276SCyrill Gorcunov 		pr_warning("Config tap device error. Are you root?");
3453b02f580SSasha Levin 		goto fail;
3463b02f580SSasha Levin 	}
3474f56d42cSAsias He 
3487668c3a6SSasha Levin 	hdr_len = has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ?
34948c6b47aSSasha Levin 			sizeof(struct virtio_net_hdr_mrg_rxbuf) :
35048c6b47aSSasha Levin 			sizeof(struct virtio_net_hdr);
3519a6d73f1SSasha Levin 	if (ioctl(ndev->tap_fd, TUNSETVNETHDRSZ, &hdr_len) < 0)
3524542f276SCyrill Gorcunov 		pr_warning("Config tap device TUNSETVNETHDRSZ error");
353246c8347SAsias He 
354246c8347SAsias He 	offload = TUN_F_CSUM | TUN_F_TSO4 | TUN_F_TSO6 | TUN_F_UFO;
3559a6d73f1SSasha Levin 	if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) {
3564542f276SCyrill Gorcunov 		pr_warning("Config tap device TUNSETOFFLOAD error");
357246c8347SAsias He 		goto fail;
358246c8347SAsias He 	}
3594f56d42cSAsias He 
36073b7d038SAmos Kong 	if (strcmp(params->script, "none")) {
361*eef27ae3SFan Du 		if (virtio_net_exec_script(params->script, ndev->tap_name) < 0)
36273b7d038SAmos Kong 			goto fail;
3631dfc7c24SMarc Zyngier 	} else if (!skipconf) {
364cb7202c1SSasha Levin 		memset(&ifr, 0, sizeof(ifr));
3659a6d73f1SSasha Levin 		strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ndev->tap_name));
366bdfcfca6SSasha Levin 		sin.sin_addr.s_addr = inet_addr(params->host_ip);
367cb7202c1SSasha Levin 		memcpy(&(ifr.ifr_addr), &sin, sizeof(ifr.ifr_addr));
368cb7202c1SSasha Levin 		ifr.ifr_addr.sa_family = AF_INET;
3693b02f580SSasha Levin 		if (ioctl(sock, SIOCSIFADDR, &ifr) < 0) {
3704542f276SCyrill Gorcunov 			pr_warning("Could not set ip address on tap device");
3713b02f580SSasha Levin 			goto fail;
3723b02f580SSasha Levin 		}
37373b7d038SAmos Kong 	}
374cb7202c1SSasha Levin 
3751dfc7c24SMarc Zyngier 	if (!skipconf) {
376cb7202c1SSasha Levin 		memset(&ifr, 0, sizeof(ifr));
3779a6d73f1SSasha Levin 		strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ndev->tap_name));
378cb7202c1SSasha Levin 		ioctl(sock, SIOCGIFFLAGS, &ifr);
379cb7202c1SSasha Levin 		ifr.ifr_flags |= IFF_UP | IFF_RUNNING;
380cb7202c1SSasha Levin 		if (ioctl(sock, SIOCSIFFLAGS, &ifr) < 0)
3814542f276SCyrill Gorcunov 			pr_warning("Could not bring tap device up");
3821dfc7c24SMarc Zyngier 	}
383cb7202c1SSasha Levin 
384cb7202c1SSasha Levin 	close(sock);
3853b02f580SSasha Levin 
3863b02f580SSasha Levin 	return 1;
3873b02f580SSasha Levin 
3883b02f580SSasha Levin fail:
3893b02f580SSasha Levin 	if (sock >= 0)
3903b02f580SSasha Levin 		close(sock);
3919a6d73f1SSasha Levin 	if (ndev->tap_fd >= 0)
3929a6d73f1SSasha Levin 		close(ndev->tap_fd);
3933b02f580SSasha Levin 
3943b02f580SSasha Levin 	return 0;
3954f56d42cSAsias He }
3964f56d42cSAsias He 
397b4fdde6dSAsias He static inline int tap_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev)
398b4fdde6dSAsias He {
399b4fdde6dSAsias He 	return writev(ndev->tap_fd, iov, out);
400b4fdde6dSAsias He }
401b4fdde6dSAsias He 
402b4fdde6dSAsias He static inline int tap_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev)
403b4fdde6dSAsias He {
404b4fdde6dSAsias He 	return readv(ndev->tap_fd, iov, in);
405b4fdde6dSAsias He }
406b4fdde6dSAsias He 
407b4fdde6dSAsias He static inline int uip_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev)
408b4fdde6dSAsias He {
409b4fdde6dSAsias He 	return uip_tx(iov, out, &ndev->info);
410b4fdde6dSAsias He }
411b4fdde6dSAsias He 
412b4fdde6dSAsias He static inline int uip_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev)
413b4fdde6dSAsias He {
414b4fdde6dSAsias He 	return uip_rx(iov, in, &ndev->info);
415b4fdde6dSAsias He }
416b4fdde6dSAsias He 
417b4fdde6dSAsias He static struct net_dev_operations tap_ops = {
418b4fdde6dSAsias He 	.rx	= tap_ops_rx,
419b4fdde6dSAsias He 	.tx	= tap_ops_tx,
420b4fdde6dSAsias He };
421b4fdde6dSAsias He 
422b4fdde6dSAsias He static struct net_dev_operations uip_ops = {
423b4fdde6dSAsias He 	.rx	= uip_ops_rx,
424b4fdde6dSAsias He 	.tx	= uip_ops_tx,
425b4fdde6dSAsias He };
426b4fdde6dSAsias He 
427c5ae742bSSasha Levin static u8 *get_config(struct kvm *kvm, void *dev)
42878a2a3e2SSasha Levin {
42978a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
43078a2a3e2SSasha Levin 
431c5ae742bSSasha Levin 	return ((u8 *)(&ndev->config));
43278a2a3e2SSasha Levin }
43378a2a3e2SSasha Levin 
43478a2a3e2SSasha Levin static u32 get_host_features(struct kvm *kvm, void *dev)
43578a2a3e2SSasha Levin {
43679052597SSasha Levin 	struct net_dev *ndev = dev;
43779052597SSasha Levin 
43878a2a3e2SSasha Levin 	return 1UL << VIRTIO_NET_F_MAC
43978a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_CSUM
44078a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_HOST_UFO
44178a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_HOST_TSO4
44278a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_HOST_TSO6
44378a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_GUEST_UFO
44478a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_GUEST_TSO4
44592c1f37bSSasha Levin 		| 1UL << VIRTIO_NET_F_GUEST_TSO6
446754c8ce3SSasha Levin 		| 1UL << VIRTIO_RING_F_EVENT_IDX
447abd4a801SSasha Levin 		| 1UL << VIRTIO_RING_F_INDIRECT_DESC
4486585ffb7SSasha Levin 		| 1UL << VIRTIO_NET_F_CTRL_VQ
4497668c3a6SSasha Levin 		| 1UL << VIRTIO_NET_F_MRG_RXBUF
45079052597SSasha Levin 		| 1UL << (ndev->queue_pairs > 1 ? VIRTIO_NET_F_MQ : 0);
45178a2a3e2SSasha Levin }
45278a2a3e2SSasha Levin 
45315636d5eSYing-Shiuan Pan static int virtio_net__vhost_set_features(struct net_dev *ndev)
45415636d5eSYing-Shiuan Pan {
45515636d5eSYing-Shiuan Pan 	u64 features = 1UL << VIRTIO_RING_F_EVENT_IDX;
45615636d5eSYing-Shiuan Pan 	u64 vhost_features;
45715636d5eSYing-Shiuan Pan 
45815636d5eSYing-Shiuan Pan 	if (ioctl(ndev->vhost_fd, VHOST_GET_FEATURES, &vhost_features) != 0)
45915636d5eSYing-Shiuan Pan 		die_perror("VHOST_GET_FEATURES failed");
46015636d5eSYing-Shiuan Pan 
46115636d5eSYing-Shiuan Pan 	/* make sure both side support mergable rx buffers */
46215636d5eSYing-Shiuan Pan 	if (vhost_features & 1UL << VIRTIO_NET_F_MRG_RXBUF &&
46315636d5eSYing-Shiuan Pan 			has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF))
46415636d5eSYing-Shiuan Pan 		features |= 1UL << VIRTIO_NET_F_MRG_RXBUF;
46515636d5eSYing-Shiuan Pan 
46615636d5eSYing-Shiuan Pan 	return ioctl(ndev->vhost_fd, VHOST_SET_FEATURES, &features);
46715636d5eSYing-Shiuan Pan }
46815636d5eSYing-Shiuan Pan 
46978a2a3e2SSasha Levin static void set_guest_features(struct kvm *kvm, void *dev, u32 features)
47078a2a3e2SSasha Levin {
47178a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
4728ed60bbeSMarc Zyngier 	struct virtio_net_config *conf = &ndev->config;
47378a2a3e2SSasha Levin 
47478a2a3e2SSasha Levin 	ndev->features = features;
4758aa155c4SYing-Shiuan Pan 
4768ed60bbeSMarc Zyngier 	conf->status = virtio_host_to_guest_u16(&ndev->vdev, conf->status);
4778ed60bbeSMarc Zyngier 	conf->max_virtqueue_pairs = virtio_host_to_guest_u16(&ndev->vdev,
4788ed60bbeSMarc Zyngier 							     conf->max_virtqueue_pairs);
4798ed60bbeSMarc Zyngier 
4808aa155c4SYing-Shiuan Pan 	if (ndev->mode == NET_MODE_TAP) {
4818aa155c4SYing-Shiuan Pan 		if (!virtio_net__tap_init(ndev))
4828aa155c4SYing-Shiuan Pan 			die_perror("You have requested a TAP device, but creation of one has failed because");
48315636d5eSYing-Shiuan Pan 		if (ndev->vhost_fd &&
48415636d5eSYing-Shiuan Pan 				virtio_net__vhost_set_features(ndev) != 0)
48515636d5eSYing-Shiuan Pan 			die_perror("VHOST_SET_FEATURES failed");
4868aa155c4SYing-Shiuan Pan 	} else {
4878aa155c4SYing-Shiuan Pan 		ndev->info.vnet_hdr_len = has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ?
4888aa155c4SYing-Shiuan Pan 						sizeof(struct virtio_net_hdr_mrg_rxbuf) :
4898aa155c4SYing-Shiuan Pan 						sizeof(struct virtio_net_hdr);
4908aa155c4SYing-Shiuan Pan 		uip_init(&ndev->info);
4918aa155c4SYing-Shiuan Pan 	}
49278a2a3e2SSasha Levin }
49378a2a3e2SSasha Levin 
4949e56ec14SSasha Levin static bool is_ctrl_vq(struct net_dev *ndev, u32 vq)
4959e56ec14SSasha Levin {
4969e56ec14SSasha Levin 	return vq == (u32)(ndev->queue_pairs * 2);
4979e56ec14SSasha Levin }
4989e56ec14SSasha Levin 
499c59ba304SWill Deacon static int init_vq(struct kvm *kvm, void *dev, u32 vq, u32 page_size, u32 align,
500c59ba304SWill Deacon 		   u32 pfn)
50178a2a3e2SSasha Levin {
5029ed67cdcSSasha Levin 	struct vhost_vring_state state = { .index = vq };
5039ed67cdcSSasha Levin 	struct vhost_vring_addr addr;
50478a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
50578a2a3e2SSasha Levin 	struct virt_queue *queue;
50678a2a3e2SSasha Levin 	void *p;
5079ed67cdcSSasha Levin 	int r;
50878a2a3e2SSasha Levin 
509312c62d1SSasha Levin 	compat__remove_message(compat_id);
51078a2a3e2SSasha Levin 
51178a2a3e2SSasha Levin 	queue		= &ndev->vqs[vq];
51278a2a3e2SSasha Levin 	queue->pfn	= pfn;
513e7e2950aSSasha Levin 	p		= virtio_get_vq(kvm, queue->pfn, page_size);
51478a2a3e2SSasha Levin 
515c59ba304SWill Deacon 	vring_init(&queue->vring, VIRTIO_NET_QUEUE_SIZE, p, align);
5168ed60bbeSMarc Zyngier 	virtio_init_device_vq(&ndev->vdev, queue);
51778a2a3e2SSasha Levin 
5186585ffb7SSasha Levin 	mutex_init(&ndev->io_lock[vq]);
5196585ffb7SSasha Levin 	pthread_cond_init(&ndev->io_cond[vq], NULL);
5209e56ec14SSasha Levin 	if (is_ctrl_vq(ndev, vq)) {
5216585ffb7SSasha Levin 		pthread_create(&ndev->io_thread[vq], NULL, virtio_net_ctrl_thread, ndev);
5229e56ec14SSasha Levin 
5239e56ec14SSasha Levin 		return 0;
5249e56ec14SSasha Levin 	} else if (ndev->vhost_fd == 0 ) {
5259e56ec14SSasha Levin 		if (vq & 1)
5266585ffb7SSasha Levin 			pthread_create(&ndev->io_thread[vq], NULL, virtio_net_tx_thread, ndev);
5276585ffb7SSasha Levin 		else
5286585ffb7SSasha Levin 			pthread_create(&ndev->io_thread[vq], NULL, virtio_net_rx_thread, ndev);
5296585ffb7SSasha Levin 
53078a2a3e2SSasha Levin 		return 0;
5316585ffb7SSasha Levin 	}
5329ed67cdcSSasha Levin 
5338ed60bbeSMarc Zyngier 	if (queue->endian != VIRTIO_ENDIAN_HOST)
5348ed60bbeSMarc Zyngier 		die_perror("VHOST requires VIRTIO_ENDIAN_HOST");
5358ed60bbeSMarc Zyngier 
5369ed67cdcSSasha Levin 	state.num = queue->vring.num;
5379ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_NUM, &state);
5389ed67cdcSSasha Levin 	if (r < 0)
5399ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_NUM failed");
5409ed67cdcSSasha Levin 	state.num = 0;
5419ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_BASE, &state);
5429ed67cdcSSasha Levin 	if (r < 0)
5439ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_BASE failed");
5449ed67cdcSSasha Levin 
5459ed67cdcSSasha Levin 	addr = (struct vhost_vring_addr) {
5469ed67cdcSSasha Levin 		.index = vq,
5479ed67cdcSSasha Levin 		.desc_user_addr = (u64)(unsigned long)queue->vring.desc,
5489ed67cdcSSasha Levin 		.avail_user_addr = (u64)(unsigned long)queue->vring.avail,
5499ed67cdcSSasha Levin 		.used_user_addr = (u64)(unsigned long)queue->vring.used,
5509ed67cdcSSasha Levin 	};
5519ed67cdcSSasha Levin 
5529ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_ADDR, &addr);
5539ed67cdcSSasha Levin 	if (r < 0)
5549ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_ADDR failed");
5559ed67cdcSSasha Levin 
5569ed67cdcSSasha Levin 	return 0;
5579ed67cdcSSasha Levin }
5589ed67cdcSSasha Levin 
5599ed67cdcSSasha Levin static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi)
5609ed67cdcSSasha Levin {
5619ed67cdcSSasha Levin 	struct net_dev *ndev = dev;
5629ed67cdcSSasha Levin 	struct kvm_irqfd irq;
5639ed67cdcSSasha Levin 	struct vhost_vring_file file;
5649ed67cdcSSasha Levin 	int r;
5659ed67cdcSSasha Levin 
5669ed67cdcSSasha Levin 	if (ndev->vhost_fd == 0)
5679ed67cdcSSasha Levin 		return;
5689ed67cdcSSasha Levin 
5699ed67cdcSSasha Levin 	irq = (struct kvm_irqfd) {
5709ed67cdcSSasha Levin 		.gsi	= gsi,
5719ed67cdcSSasha Levin 		.fd	= eventfd(0, 0),
5729ed67cdcSSasha Levin 	};
5739ed67cdcSSasha Levin 	file = (struct vhost_vring_file) {
5749ed67cdcSSasha Levin 		.index	= vq,
5759ed67cdcSSasha Levin 		.fd	= irq.fd,
5769ed67cdcSSasha Levin 	};
5779ed67cdcSSasha Levin 
5789ed67cdcSSasha Levin 	r = ioctl(kvm->vm_fd, KVM_IRQFD, &irq);
5799ed67cdcSSasha Levin 	if (r < 0)
5809ed67cdcSSasha Levin 		die_perror("KVM_IRQFD failed");
5819ed67cdcSSasha Levin 
5829ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_CALL, &file);
5839ed67cdcSSasha Levin 	if (r < 0)
5849ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_CALL failed");
5859ed67cdcSSasha Levin 	file.fd = ndev->tap_fd;
5869ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_NET_SET_BACKEND, &file);
5879ed67cdcSSasha Levin 	if (r != 0)
5889ed67cdcSSasha Levin 		die("VHOST_NET_SET_BACKEND failed %d", errno);
5899ed67cdcSSasha Levin 
5909ed67cdcSSasha Levin }
5919ed67cdcSSasha Levin 
5929ed67cdcSSasha Levin static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd)
5939ed67cdcSSasha Levin {
5949ed67cdcSSasha Levin 	struct net_dev *ndev = dev;
5959ed67cdcSSasha Levin 	struct vhost_vring_file file = {
5969ed67cdcSSasha Levin 		.index	= vq,
5979ed67cdcSSasha Levin 		.fd	= efd,
5989ed67cdcSSasha Levin 	};
5999ed67cdcSSasha Levin 	int r;
6009ed67cdcSSasha Levin 
6019e56ec14SSasha Levin 	if (ndev->vhost_fd == 0 || is_ctrl_vq(ndev, vq))
6029ed67cdcSSasha Levin 		return;
6039ed67cdcSSasha Levin 
6049ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_KICK, &file);
6059ed67cdcSSasha Levin 	if (r < 0)
6069ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_KICK failed");
60778a2a3e2SSasha Levin }
60878a2a3e2SSasha Levin 
60978a2a3e2SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq)
61078a2a3e2SSasha Levin {
6119a6d73f1SSasha Levin 	struct net_dev *ndev = dev;
6129a6d73f1SSasha Levin 
6139a6d73f1SSasha Levin 	virtio_net_handle_callback(kvm, ndev, vq);
61478a2a3e2SSasha Levin 
61578a2a3e2SSasha Levin 	return 0;
61678a2a3e2SSasha Levin }
61778a2a3e2SSasha Levin 
61878a2a3e2SSasha Levin static int get_pfn_vq(struct kvm *kvm, void *dev, u32 vq)
61978a2a3e2SSasha Levin {
62078a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
62178a2a3e2SSasha Levin 
62278a2a3e2SSasha Levin 	return ndev->vqs[vq].pfn;
62378a2a3e2SSasha Levin }
62478a2a3e2SSasha Levin 
62578a2a3e2SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq)
62678a2a3e2SSasha Levin {
6270f4f51a8SAsias He 	/* FIXME: dynamic */
62878a2a3e2SSasha Levin 	return VIRTIO_NET_QUEUE_SIZE;
62978a2a3e2SSasha Levin }
63078a2a3e2SSasha Levin 
6310f4f51a8SAsias He static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size)
6320f4f51a8SAsias He {
6330f4f51a8SAsias He 	/* FIXME: dynamic */
6340f4f51a8SAsias He 	return size;
6350f4f51a8SAsias He }
6360f4f51a8SAsias He 
63715542babSAndre Przywara static struct virtio_ops net_dev_virtio_ops = {
6381c47ce69SSasha Levin 	.get_config		= get_config,
6391c47ce69SSasha Levin 	.get_host_features	= get_host_features,
6401c47ce69SSasha Levin 	.set_guest_features	= set_guest_features,
6411c47ce69SSasha Levin 	.init_vq		= init_vq,
6421c47ce69SSasha Levin 	.get_pfn_vq		= get_pfn_vq,
6431c47ce69SSasha Levin 	.get_size_vq		= get_size_vq,
6440f4f51a8SAsias He 	.set_size_vq		= set_size_vq,
6450f4f51a8SAsias He 	.notify_vq		= notify_vq,
6469ed67cdcSSasha Levin 	.notify_vq_gsi		= notify_vq_gsi,
6479ed67cdcSSasha Levin 	.notify_vq_eventfd	= notify_vq_eventfd,
6481c47ce69SSasha Levin };
6491c47ce69SSasha Levin 
6509ed67cdcSSasha Levin static void virtio_net__vhost_init(struct kvm *kvm, struct net_dev *ndev)
6519ed67cdcSSasha Levin {
6527f9733c2SAndreas Herrmann 	struct kvm_mem_bank *bank;
6539ed67cdcSSasha Levin 	struct vhost_memory *mem;
6547f9733c2SAndreas Herrmann 	int r, i;
6559ed67cdcSSasha Levin 
6569ed67cdcSSasha Levin 	ndev->vhost_fd = open("/dev/vhost-net", O_RDWR);
6579ed67cdcSSasha Levin 	if (ndev->vhost_fd < 0)
6589ed67cdcSSasha Levin 		die_perror("Failed openning vhost-net device");
6599ed67cdcSSasha Levin 
6607f9733c2SAndreas Herrmann 	mem = calloc(1, sizeof(*mem) + kvm->mem_slots * sizeof(struct vhost_memory_region));
6619ed67cdcSSasha Levin 	if (mem == NULL)
6629ed67cdcSSasha Levin 		die("Failed allocating memory for vhost memory map");
6639ed67cdcSSasha Levin 
6647f9733c2SAndreas Herrmann 	i = 0;
6657f9733c2SAndreas Herrmann 	list_for_each_entry(bank, &kvm->mem_banks, list) {
6667f9733c2SAndreas Herrmann 		mem->regions[i] = (struct vhost_memory_region) {
6677f9733c2SAndreas Herrmann 			.guest_phys_addr = bank->guest_phys_addr,
6687f9733c2SAndreas Herrmann 			.memory_size	 = bank->size,
6697f9733c2SAndreas Herrmann 			.userspace_addr	 = (unsigned long)bank->host_addr,
6709ed67cdcSSasha Levin 		};
6717f9733c2SAndreas Herrmann 		i++;
6727f9733c2SAndreas Herrmann 	}
6737f9733c2SAndreas Herrmann 	mem->nregions = i;
6749ed67cdcSSasha Levin 
6759ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_OWNER);
6769ed67cdcSSasha Levin 	if (r != 0)
6779ed67cdcSSasha Levin 		die_perror("VHOST_SET_OWNER failed");
6789ed67cdcSSasha Levin 
6799ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_MEM_TABLE, mem);
6809ed67cdcSSasha Levin 	if (r != 0)
6819ed67cdcSSasha Levin 		die_perror("VHOST_SET_MEM_TABLE failed");
682627d6874SAsias He 
683627d6874SAsias He 	ndev->vdev.use_vhost = true;
684627d6874SAsias He 
6859ed67cdcSSasha Levin 	free(mem);
6869ed67cdcSSasha Levin }
6879ed67cdcSSasha Levin 
/*
 * Parse a colon-separated MAC address ("aa:bb:cc:dd:ee:ff", hex octets)
 * from @str into the six bytes at @mac.
 *
 * The octets are scanned into a local buffer and copied out only when all
 * six were converted, so a malformed string leaves @mac untouched instead
 * of half-overwritten. The local buffer is unsigned char because that is
 * the pointer type the %hhx conversion expects.
 */
static inline void str_to_mac(const char *str, char *mac)
{
	unsigned char octets[6];
	int i;

	if (sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
		   &octets[0], &octets[1], &octets[2],
		   &octets[3], &octets[4], &octets[5]) != 6)
		return;

	for (i = 0; i < 6; i++)
		mac[i] = octets[i];
}
6934346fd8fSSasha Levin static int set_net_param(struct kvm *kvm, struct virtio_net_params *p,
6944346fd8fSSasha Levin 			const char *param, const char *val)
6955f225124SSasha Levin {
6965f225124SSasha Levin 	if (strcmp(param, "guest_mac") == 0) {
6975f225124SSasha Levin 		str_to_mac(val, p->guest_mac);
6985f225124SSasha Levin 	} else if (strcmp(param, "mode") == 0) {
6995f225124SSasha Levin 		if (!strncmp(val, "user", 4)) {
7005f225124SSasha Levin 			int i;
7015f225124SSasha Levin 
7025f225124SSasha Levin 			for (i = 0; i < kvm->cfg.num_net_devices; i++)
7035f225124SSasha Levin 				if (kvm->cfg.net_params[i].mode == NET_MODE_USER)
7045f225124SSasha Levin 					die("Only one usermode network device allowed at a time");
7055f225124SSasha Levin 			p->mode = NET_MODE_USER;
7065f225124SSasha Levin 		} else if (!strncmp(val, "tap", 3)) {
7075f225124SSasha Levin 			p->mode = NET_MODE_TAP;
7085f225124SSasha Levin 		} else if (!strncmp(val, "none", 4)) {
7095f225124SSasha Levin 			kvm->cfg.no_net = 1;
7105f225124SSasha Levin 			return -1;
7115f225124SSasha Levin 		} else
7125f225124SSasha Levin 			die("Unknown network mode %s, please use user, tap or none", kvm->cfg.network);
7135f225124SSasha Levin 	} else if (strcmp(param, "script") == 0) {
7145f225124SSasha Levin 		p->script = strdup(val);
715*eef27ae3SFan Du 	} else if (strcmp(param, "downscript") == 0) {
716*eef27ae3SFan Du 		p->downscript = strdup(val);
7175f225124SSasha Levin 	} else if (strcmp(param, "guest_ip") == 0) {
7185f225124SSasha Levin 		p->guest_ip = strdup(val);
7195f225124SSasha Levin 	} else if (strcmp(param, "host_ip") == 0) {
7205f225124SSasha Levin 		p->host_ip = strdup(val);
7215f225124SSasha Levin 	} else if (strcmp(param, "trans") == 0) {
7225f225124SSasha Levin 		p->trans = strdup(val);
7231dfc7c24SMarc Zyngier 	} else if (strcmp(param, "tapif") == 0) {
7241dfc7c24SMarc Zyngier 		p->tapif = strdup(val);
7255f225124SSasha Levin 	} else if (strcmp(param, "vhost") == 0) {
7265f225124SSasha Levin 		p->vhost = atoi(val);
7275f225124SSasha Levin 	} else if (strcmp(param, "fd") == 0) {
7285f225124SSasha Levin 		p->fd = atoi(val);
72979052597SSasha Levin 	} else if (strcmp(param, "mq") == 0) {
73079052597SSasha Levin 		p->mq = atoi(val);
7315f225124SSasha Levin 	} else
7325f225124SSasha Levin 		die("Unknown network parameter %s", param);
7335f225124SSasha Levin 
7345f225124SSasha Levin 	return 0;
7355f225124SSasha Levin }
7365f225124SSasha Levin 
7375f225124SSasha Levin int netdev_parser(const struct option *opt, const char *arg, int unset)
7385f225124SSasha Levin {
7395f225124SSasha Levin 	struct virtio_net_params p;
7405f225124SSasha Levin 	char *buf = NULL, *cmd = NULL, *cur = NULL;
7415f225124SSasha Levin 	bool on_cmd = true;
7425f225124SSasha Levin 	struct kvm *kvm = opt->ptr;
7435f225124SSasha Levin 
7445f225124SSasha Levin 	if (arg) {
7455f225124SSasha Levin 		buf = strdup(arg);
7465f225124SSasha Levin 		if (buf == NULL)
7475f225124SSasha Levin 			die("Failed allocating new net buffer");
7485f225124SSasha Levin 		cur = strtok(buf, ",=");
7495f225124SSasha Levin 	}
7505f225124SSasha Levin 
7515f225124SSasha Levin 	p = (struct virtio_net_params) {
7525f225124SSasha Levin 		.guest_ip	= DEFAULT_GUEST_ADDR,
7535f225124SSasha Levin 		.host_ip	= DEFAULT_HOST_ADDR,
7545f225124SSasha Levin 		.script		= DEFAULT_SCRIPT,
755*eef27ae3SFan Du 		.downscript	= DEFAULT_SCRIPT,
7565f225124SSasha Levin 		.mode		= NET_MODE_TAP,
7575f225124SSasha Levin 	};
7585f225124SSasha Levin 
7595f225124SSasha Levin 	str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac);
7605f225124SSasha Levin 	p.guest_mac[5] += kvm->cfg.num_net_devices;
7615f225124SSasha Levin 
7625f225124SSasha Levin 	while (cur) {
7635f225124SSasha Levin 		if (on_cmd) {
7645f225124SSasha Levin 			cmd = cur;
7655f225124SSasha Levin 		} else {
7664346fd8fSSasha Levin 			if (set_net_param(kvm, &p, cmd, cur) < 0)
7675f225124SSasha Levin 				goto done;
7685f225124SSasha Levin 		}
7695f225124SSasha Levin 		on_cmd = !on_cmd;
7705f225124SSasha Levin 
7715f225124SSasha Levin 		cur = strtok(NULL, ",=");
7725f225124SSasha Levin 	};
7735f225124SSasha Levin 
7745f225124SSasha Levin 	kvm->cfg.num_net_devices++;
7755f225124SSasha Levin 
7765f225124SSasha Levin 	kvm->cfg.net_params = realloc(kvm->cfg.net_params, kvm->cfg.num_net_devices * sizeof(*kvm->cfg.net_params));
7775f225124SSasha Levin 	if (kvm->cfg.net_params == NULL)
7785f225124SSasha Levin 		die("Failed adding new network device");
7795f225124SSasha Levin 
7805f225124SSasha Levin 	kvm->cfg.net_params[kvm->cfg.num_net_devices - 1] = p;
7815f225124SSasha Levin 
7825f225124SSasha Levin done:
7835f225124SSasha Levin 	free(buf);
7845f225124SSasha Levin 	return 0;
7855f225124SSasha Levin }
7865f225124SSasha Levin 
7875f225124SSasha Levin static int virtio_net__init_one(struct virtio_net_params *params)
7884f56d42cSAsias He {
78976a4aac6SWill Deacon 	int i, err;
7909a6d73f1SSasha Levin 	struct net_dev *ndev;
79176a4aac6SWill Deacon 	struct virtio_ops *ops;
792dc7a55d6SSuzuki K. Poulose 	enum virtio_trans trans = VIRTIO_DEFAULT_TRANS(params->kvm);
7939a6d73f1SSasha Levin 
7949a6d73f1SSasha Levin 	ndev = calloc(1, sizeof(struct net_dev));
7959a6d73f1SSasha Levin 	if (ndev == NULL)
7965f225124SSasha Levin 		return -ENOMEM;
7979a6d73f1SSasha Levin 
79876a4aac6SWill Deacon 	ops = malloc(sizeof(*ops));
79976a4aac6SWill Deacon 	if (ops == NULL) {
80076a4aac6SWill Deacon 		err = -ENOMEM;
80176a4aac6SWill Deacon 		goto err_free_ndev;
80276a4aac6SWill Deacon 	}
80376a4aac6SWill Deacon 
8049a6d73f1SSasha Levin 	list_add_tail(&ndev->list, &ndevs);
8059a6d73f1SSasha Levin 
8069a6d73f1SSasha Levin 	ndev->kvm = params->kvm;
8078c0ae74dSSasha Levin 	ndev->params = params;
8089a6d73f1SSasha Levin 
8099a6d73f1SSasha Levin 	mutex_init(&ndev->mutex);
81079052597SSasha Levin 	ndev->queue_pairs = max(1, min(VIRTIO_NET_NUM_QUEUES, params->mq));
8119a6d73f1SSasha Levin 	ndev->config.status = VIRTIO_NET_S_LINK_UP;
81279052597SSasha Levin 	if (ndev->queue_pairs > 1)
81379052597SSasha Levin 		ndev->config.max_virtqueue_pairs = ndev->queue_pairs;
81479052597SSasha Levin 
8150c54698eSAsias He 	for (i = 0 ; i < 6 ; i++) {
8169a6d73f1SSasha Levin 		ndev->config.mac[i]		= params->guest_mac[i];
8179a6d73f1SSasha Levin 		ndev->info.guest_mac.addr[i]	= params->guest_mac[i];
8189a6d73f1SSasha Levin 		ndev->info.host_mac.addr[i]	= params->host_mac[i];
8190c54698eSAsias He 	}
820f715177dSAsias He 
8219a6d73f1SSasha Levin 	ndev->mode = params->mode;
8229a6d73f1SSasha Levin 	if (ndev->mode == NET_MODE_TAP) {
8239a6d73f1SSasha Levin 		ndev->ops = &tap_ops;
824b4fdde6dSAsias He 	} else {
8259a6d73f1SSasha Levin 		ndev->info.host_ip		= ntohl(inet_addr(params->host_ip));
8269a6d73f1SSasha Levin 		ndev->info.guest_ip		= ntohl(inet_addr(params->guest_ip));
8279a6d73f1SSasha Levin 		ndev->info.guest_netmask	= ntohl(inet_addr("255.255.255.0"));
8289a6d73f1SSasha Levin 		ndev->info.buf_nr		= 20,
8299a6d73f1SSasha Levin 		ndev->ops = &uip_ops;
8305f3aaf22SMarc Zyngier 		uip_static_init(&ndev->info);
831b4fdde6dSAsias He 	}
832b5ee1ea7SAsias He 
83376a4aac6SWill Deacon 	*ops = net_dev_virtio_ops;
834dc7a55d6SSuzuki K. Poulose 
835dc7a55d6SSuzuki K. Poulose 	if (params->trans) {
836dc7a55d6SSuzuki K. Poulose 		if (strcmp(params->trans, "mmio") == 0)
837dc7a55d6SSuzuki K. Poulose 			trans = VIRTIO_MMIO;
838dc7a55d6SSuzuki K. Poulose 		else if (strcmp(params->trans, "pci") == 0)
839dc7a55d6SSuzuki K. Poulose 			trans = VIRTIO_PCI;
84069205aa1SAsias He 		else
841dc7a55d6SSuzuki K. Poulose 			pr_warning("virtio-net: Unknown transport method : %s, "
842dc7a55d6SSuzuki K. Poulose 				   "falling back to %s.", params->trans,
843dc7a55d6SSuzuki K. Poulose 				   virtio_trans_name(trans));
844dc7a55d6SSuzuki K. Poulose 	}
845dc7a55d6SSuzuki K. Poulose 
846dc7a55d6SSuzuki K. Poulose 	virtio_init(params->kvm, ndev, &ndev->vdev, ops, trans,
84776a4aac6SWill Deacon 		    PCI_DEVICE_ID_VIRTIO_NET, VIRTIO_ID_NET, PCI_CLASS_NET);
84827ab67f5SSasha Levin 
8499ed67cdcSSasha Levin 	if (params->vhost)
8509ed67cdcSSasha Levin 		virtio_net__vhost_init(params->kvm, ndev);
851cb83de6fSSasha Levin 
852d278197dSAsias He 	if (compat_id == -1)
85352f34d2cSAsias He 		compat_id = virtio_compat_add_message("virtio-net", "CONFIG_VIRTIO_NET");
8545f225124SSasha Levin 
8555f225124SSasha Levin 	return 0;
85676a4aac6SWill Deacon 
85776a4aac6SWill Deacon err_free_ndev:
85876a4aac6SWill Deacon 	free(ndev);
85976a4aac6SWill Deacon 	return err;
8605f225124SSasha Levin }
8615f225124SSasha Levin 
8625f225124SSasha Levin int virtio_net__init(struct kvm *kvm)
8635f225124SSasha Levin {
8645f225124SSasha Levin 	int i;
8655f225124SSasha Levin 
8665f225124SSasha Levin 	for (i = 0; i < kvm->cfg.num_net_devices; i++) {
8675f225124SSasha Levin 		kvm->cfg.net_params[i].kvm = kvm;
8685f225124SSasha Levin 		virtio_net__init_one(&kvm->cfg.net_params[i]);
8695f225124SSasha Levin 	}
8705f225124SSasha Levin 
8715f225124SSasha Levin 	if (kvm->cfg.num_net_devices == 0 && kvm->cfg.no_net == 0) {
8728c0ae74dSSasha Levin 		static struct virtio_net_params net_params;
8735f225124SSasha Levin 
8745f225124SSasha Levin 		net_params = (struct virtio_net_params) {
8755f225124SSasha Levin 			.guest_ip	= kvm->cfg.guest_ip,
8765f225124SSasha Levin 			.host_ip	= kvm->cfg.host_ip,
8775f225124SSasha Levin 			.kvm		= kvm,
8785f225124SSasha Levin 			.script		= kvm->cfg.script,
8795f225124SSasha Levin 			.mode		= NET_MODE_USER,
8805f225124SSasha Levin 		};
8815f225124SSasha Levin 		str_to_mac(kvm->cfg.guest_mac, net_params.guest_mac);
8825f225124SSasha Levin 		str_to_mac(kvm->cfg.host_mac, net_params.host_mac);
8835f225124SSasha Levin 
8845f225124SSasha Levin 		virtio_net__init_one(&net_params);
8855f225124SSasha Levin 	}
8865f225124SSasha Levin 
8875f225124SSasha Levin 	return 0;
8885f225124SSasha Levin }
88949a8afd1SSasha Levin virtio_dev_init(virtio_net__init);
8905f225124SSasha Levin 
8915f225124SSasha Levin int virtio_net__exit(struct kvm *kvm)
8925f225124SSasha Levin {
893*eef27ae3SFan Du 	struct virtio_net_params *params;
894*eef27ae3SFan Du 	struct net_dev *ndev;
895*eef27ae3SFan Du 	struct list_head *ptr;
896*eef27ae3SFan Du 
897*eef27ae3SFan Du 	list_for_each(ptr, &ndevs) {
898*eef27ae3SFan Du 		ndev = list_entry(ptr, struct net_dev, list);
899*eef27ae3SFan Du 		params = ndev->params;
900*eef27ae3SFan Du 		/* Cleanup any tap device which attached to bridge */
901*eef27ae3SFan Du 		if (ndev->mode == NET_MODE_TAP &&
902*eef27ae3SFan Du 		    strcmp(params->downscript, "none"))
903*eef27ae3SFan Du 			virtio_net_exec_script(params->downscript, ndev->tap_name);
904*eef27ae3SFan Du 	}
9055f225124SSasha Levin 	return 0;
9064f56d42cSAsias He }
90749a8afd1SSasha Levin virtio_dev_exit(virtio_net__exit);
908