xref: /kvmtool/virtio/net.c (revision 8ed60bbe615309b2220b4c36db7a50e3f9a9d4b0)
131638bcaSCyrill Gorcunov #include "kvm/virtio-pci-dev.h"
2b5ee1ea7SAsias He #include "kvm/virtio-net.h"
34f56d42cSAsias He #include "kvm/virtio.h"
44f56d42cSAsias He #include "kvm/types.h"
54f56d42cSAsias He #include "kvm/mutex.h"
64f56d42cSAsias He #include "kvm/util.h"
74f56d42cSAsias He #include "kvm/kvm.h"
82449f6e3SSasha Levin #include "kvm/irq.h"
9b5ee1ea7SAsias He #include "kvm/uip.h"
10cb83de6fSSasha Levin #include "kvm/guest_compat.h"
117668c3a6SSasha Levin #include "kvm/iovec.h"
124f56d42cSAsias He 
139ed67cdcSSasha Levin #include <linux/vhost.h>
144f56d42cSAsias He #include <linux/virtio_net.h>
154f56d42cSAsias He #include <linux/if_tun.h>
1678a2a3e2SSasha Levin #include <linux/types.h>
17c229370aSIngo Molnar 
18c229370aSIngo Molnar #include <arpa/inet.h>
194f56d42cSAsias He #include <net/if.h>
20c229370aSIngo Molnar 
21c229370aSIngo Molnar #include <unistd.h>
224f56d42cSAsias He #include <fcntl.h>
23c229370aSIngo Molnar 
24cb7202c1SSasha Levin #include <sys/socket.h>
25c229370aSIngo Molnar #include <sys/ioctl.h>
26c229370aSIngo Molnar #include <sys/types.h>
2773b7d038SAmos Kong #include <sys/wait.h>
289ed67cdcSSasha Levin #include <sys/eventfd.h>
294f56d42cSAsias He 
/* Ring size handed to vring_init() and reported by get_size_vq(). */
#define VIRTIO_NET_QUEUE_SIZE		256
/* Upper bound on rx/tx queue pairs; sizes the per-queue arrays in struct net_dev. */
#define VIRTIO_NET_NUM_QUEUES		8
324f56d42cSAsias He 
33b4fdde6dSAsias He struct net_dev;
34b4fdde6dSAsias He 
35b4fdde6dSAsias He struct net_dev_operations {
36b4fdde6dSAsias He 	int (*rx)(struct iovec *iov, u16 in, struct net_dev *ndev);
37b4fdde6dSAsias He 	int (*tx)(struct iovec *iov, u16 in, struct net_dev *ndev);
38b4fdde6dSAsias He };
39b4fdde6dSAsias He 
408626798bSAsias He struct net_dev {
41d3476f7dSSasha Levin 	struct mutex			mutex;
4202eca50cSAsias He 	struct virtio_device		vdev;
439a6d73f1SSasha Levin 	struct list_head		list;
444f56d42cSAsias He 
456585ffb7SSasha Levin 	struct virt_queue		vqs[VIRTIO_NET_NUM_QUEUES * 2 + 1];
46c229370aSIngo Molnar 	struct virtio_net_config	config;
4779052597SSasha Levin 	u32				features, rx_vqs, tx_vqs, queue_pairs;
484f56d42cSAsias He 
496585ffb7SSasha Levin 	pthread_t			io_thread[VIRTIO_NET_NUM_QUEUES * 2 + 1];
506585ffb7SSasha Levin 	struct mutex			io_lock[VIRTIO_NET_NUM_QUEUES * 2 + 1];
516585ffb7SSasha Levin 	pthread_cond_t			io_cond[VIRTIO_NET_NUM_QUEUES * 2 + 1];
52c4aa7c02SPekka Enberg 
539ed67cdcSSasha Levin 	int				vhost_fd;
544f56d42cSAsias He 	int				tap_fd;
554f56d42cSAsias He 	char				tap_name[IFNAMSIZ];
56bb1a32f1SAsias He 
57bb1a32f1SAsias He 	int				mode;
58bb1a32f1SAsias He 
59b5ee1ea7SAsias He 	struct uip_info			info;
60b4fdde6dSAsias He 	struct net_dev_operations	*ops;
619a6d73f1SSasha Levin 	struct kvm			*kvm;
628c0ae74dSSasha Levin 
638c0ae74dSSasha Levin 	struct virtio_net_params	*params;
644f56d42cSAsias He };
654f56d42cSAsias He 
/*
 * List head for net devices. Its users are outside this excerpt;
 * presumably devices are linked through net_dev.list (TODO confirm).
 */
static LIST_HEAD(ndevs);
/* Identifier handed to compat__remove_message() when a queue is set up. */
static int compat_id = -1;

/* Payload capacity of the rx thread's bounce buffer (header space is added on top). */
#define MAX_PACKET_SIZE 65550
707668c3a6SSasha Levin 
717668c3a6SSasha Levin static bool has_virtio_feature(struct net_dev *ndev, u32 feature)
727668c3a6SSasha Levin {
737668c3a6SSasha Levin 	return ndev->features & (1 << feature);
747668c3a6SSasha Levin }
757668c3a6SSasha Levin 
76*8ed60bbeSMarc Zyngier static void virtio_net_fix_tx_hdr(struct virtio_net_hdr *hdr, struct net_dev *ndev)
77*8ed60bbeSMarc Zyngier {
78*8ed60bbeSMarc Zyngier 	hdr->hdr_len		= virtio_guest_to_host_u16(&ndev->vdev, hdr->hdr_len);
79*8ed60bbeSMarc Zyngier 	hdr->gso_size		= virtio_guest_to_host_u16(&ndev->vdev, hdr->gso_size);
80*8ed60bbeSMarc Zyngier 	hdr->csum_start		= virtio_guest_to_host_u16(&ndev->vdev, hdr->csum_start);
81*8ed60bbeSMarc Zyngier 	hdr->csum_offset	= virtio_guest_to_host_u16(&ndev->vdev, hdr->csum_offset);
82*8ed60bbeSMarc Zyngier }
83*8ed60bbeSMarc Zyngier 
84*8ed60bbeSMarc Zyngier static void virtio_net_fix_rx_hdr(struct virtio_net_hdr_mrg_rxbuf *hdr, struct net_dev *ndev)
85*8ed60bbeSMarc Zyngier {
86*8ed60bbeSMarc Zyngier 	hdr->hdr.hdr_len	= virtio_host_to_guest_u16(&ndev->vdev, hdr->hdr.hdr_len);
87*8ed60bbeSMarc Zyngier 	hdr->hdr.gso_size	= virtio_host_to_guest_u16(&ndev->vdev, hdr->hdr.gso_size);
88*8ed60bbeSMarc Zyngier 	hdr->hdr.csum_start	= virtio_host_to_guest_u16(&ndev->vdev, hdr->hdr.csum_start);
89*8ed60bbeSMarc Zyngier 	hdr->hdr.csum_offset	= virtio_host_to_guest_u16(&ndev->vdev, hdr->hdr.csum_offset);
90*8ed60bbeSMarc Zyngier 	if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF))
91*8ed60bbeSMarc Zyngier 		hdr->num_buffers	= virtio_host_to_guest_u16(&ndev->vdev, hdr->num_buffers);
92*8ed60bbeSMarc Zyngier }
93*8ed60bbeSMarc Zyngier 
94c4aa7c02SPekka Enberg static void *virtio_net_rx_thread(void *p)
954f56d42cSAsias He {
964f56d42cSAsias He 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
974f56d42cSAsias He 	struct virt_queue *vq;
9843835ac9SSasha Levin 	struct kvm *kvm;
999a6d73f1SSasha Levin 	struct net_dev *ndev = p;
1003fdf659dSSasha Levin 	u16 out, in;
1013fdf659dSSasha Levin 	u16 head;
1026d6cc14bSWill Deacon 	int len, copied;
1036585ffb7SSasha Levin 	u32 id;
1046585ffb7SSasha Levin 
1056585ffb7SSasha Levin 	mutex_lock(&ndev->mutex);
1066585ffb7SSasha Levin 	id = ndev->rx_vqs++ * 2;
1076585ffb7SSasha Levin 	mutex_unlock(&ndev->mutex);
1084f56d42cSAsias He 
109a4d8c55eSSasha Levin 	kvm__set_thread_name("virtio-net-rx");
110a4d8c55eSSasha Levin 
1119a6d73f1SSasha Levin 	kvm = ndev->kvm;
1126585ffb7SSasha Levin 	vq = &ndev->vqs[id];
113c4aa7c02SPekka Enberg 
114c4aa7c02SPekka Enberg 	while (1) {
1156585ffb7SSasha Levin 		mutex_lock(&ndev->io_lock[id]);
116c4aa7c02SPekka Enberg 		if (!virt_queue__available(vq))
1176585ffb7SSasha Levin 			pthread_cond_wait(&ndev->io_cond[id], &ndev->io_lock[id].mutex);
1186585ffb7SSasha Levin 		mutex_unlock(&ndev->io_lock[id]);
1194f56d42cSAsias He 
1204f56d42cSAsias He 		while (virt_queue__available(vq)) {
1217668c3a6SSasha Levin 			unsigned char buffer[MAX_PACKET_SIZE + sizeof(struct virtio_net_hdr_mrg_rxbuf)];
1227668c3a6SSasha Levin 			struct iovec dummy_iov = {
1237668c3a6SSasha Levin 				.iov_base = buffer,
1247668c3a6SSasha Levin 				.iov_len  = sizeof(buffer),
1257668c3a6SSasha Levin 			};
1267668c3a6SSasha Levin 			struct virtio_net_hdr_mrg_rxbuf *hdr;
127*8ed60bbeSMarc Zyngier 			int i;
1287f5ffaf5SAsias He 
1297668c3a6SSasha Levin 			len = ndev->ops->rx(&dummy_iov, 1, ndev);
1306d6cc14bSWill Deacon 			if (len < 0) {
1316d6cc14bSWill Deacon 				pr_warning("%s: rx on vq %u failed (%d), exiting thread\n",
1326d6cc14bSWill Deacon 						__func__, id, len);
1336d6cc14bSWill Deacon 				goto out_err;
1346d6cc14bSWill Deacon 			}
1356d6cc14bSWill Deacon 
136*8ed60bbeSMarc Zyngier 			copied = i = 0;
1377668c3a6SSasha Levin 			head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
138*8ed60bbeSMarc Zyngier 			hdr = iov[0].iov_base;
1397668c3a6SSasha Levin 			while (copied < len) {
1406d6cc14bSWill Deacon 				size_t iovsize = min_t(size_t, len - copied, iov_size(iov, in));
1417668c3a6SSasha Levin 
142e2493047SAsias He 				memcpy_toiovec(iov, buffer + copied, iovsize);
1437668c3a6SSasha Levin 				copied += iovsize;
144*8ed60bbeSMarc Zyngier 				if (i++ == 0)
145*8ed60bbeSMarc Zyngier 					virtio_net_fix_rx_hdr(hdr, ndev);
146*8ed60bbeSMarc Zyngier 				if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF)) {
147*8ed60bbeSMarc Zyngier 					u16 num_buffers = virtio_guest_to_host_u16(vq, hdr->num_buffers);
148*8ed60bbeSMarc Zyngier 					hdr->num_buffers = virtio_host_to_guest_u16(vq, num_buffers + 1);
149*8ed60bbeSMarc Zyngier 				}
1507668c3a6SSasha Levin 				virt_queue__set_used_elem(vq, head, iovsize);
1517668c3a6SSasha Levin 				if (copied == len)
1527668c3a6SSasha Levin 					break;
1537668c3a6SSasha Levin 				while (!virt_queue__available(vq))
1547668c3a6SSasha Levin 					sleep(0);
1557668c3a6SSasha Levin 				head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1567668c3a6SSasha Levin 			}
157c4aa7c02SPekka Enberg 			/* We should interrupt guest right now, otherwise latency is huge. */
1586585ffb7SSasha Levin 			if (virtio_queue__should_signal(vq))
1596585ffb7SSasha Levin 				ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, id);
1604f56d42cSAsias He 		}
161c4aa7c02SPekka Enberg 	}
162c4aa7c02SPekka Enberg 
1636d6cc14bSWill Deacon out_err:
164c4aa7c02SPekka Enberg 	pthread_exit(NULL);
165c4aa7c02SPekka Enberg 	return NULL;
166c4aa7c02SPekka Enberg 
167c4aa7c02SPekka Enberg }
168c4aa7c02SPekka Enberg 
169c4aa7c02SPekka Enberg static void *virtio_net_tx_thread(void *p)
1704f56d42cSAsias He {
1714f56d42cSAsias He 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
1724f56d42cSAsias He 	struct virt_queue *vq;
17343835ac9SSasha Levin 	struct kvm *kvm;
1749a6d73f1SSasha Levin 	struct net_dev *ndev = p;
1753fdf659dSSasha Levin 	u16 out, in;
1763fdf659dSSasha Levin 	u16 head;
1774f56d42cSAsias He 	int len;
1786585ffb7SSasha Levin 	u32 id;
1796585ffb7SSasha Levin 
1806585ffb7SSasha Levin 	mutex_lock(&ndev->mutex);
1816585ffb7SSasha Levin 	id = ndev->tx_vqs++ * 2 + 1;
1826585ffb7SSasha Levin 	mutex_unlock(&ndev->mutex);
1834f56d42cSAsias He 
184a4d8c55eSSasha Levin 	kvm__set_thread_name("virtio-net-tx");
185a4d8c55eSSasha Levin 
1869a6d73f1SSasha Levin 	kvm = ndev->kvm;
1876585ffb7SSasha Levin 	vq = &ndev->vqs[id];
188c4aa7c02SPekka Enberg 
189c4aa7c02SPekka Enberg 	while (1) {
1906585ffb7SSasha Levin 		mutex_lock(&ndev->io_lock[id]);
191c4aa7c02SPekka Enberg 		if (!virt_queue__available(vq))
1926585ffb7SSasha Levin 			pthread_cond_wait(&ndev->io_cond[id], &ndev->io_lock[id].mutex);
1936585ffb7SSasha Levin 		mutex_unlock(&ndev->io_lock[id]);
1944f56d42cSAsias He 
1954f56d42cSAsias He 		while (virt_queue__available(vq)) {
196*8ed60bbeSMarc Zyngier 			struct virtio_net_hdr *hdr;
19743835ac9SSasha Levin 			head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
198*8ed60bbeSMarc Zyngier 			hdr = iov[0].iov_base;
199*8ed60bbeSMarc Zyngier 			virtio_net_fix_tx_hdr(hdr, ndev);
2009a6d73f1SSasha Levin 			len = ndev->ops->tx(iov, out, ndev);
2016d6cc14bSWill Deacon 			if (len < 0) {
2026d6cc14bSWill Deacon 				pr_warning("%s: tx on vq %u failed (%d)\n",
203*8ed60bbeSMarc Zyngier 						__func__, id, errno);
2046d6cc14bSWill Deacon 				goto out_err;
2056d6cc14bSWill Deacon 			}
2066d6cc14bSWill Deacon 
2074f56d42cSAsias He 			virt_queue__set_used_elem(vq, head, len);
2084f56d42cSAsias He 		}
2094f56d42cSAsias He 
2106585ffb7SSasha Levin 		if (virtio_queue__should_signal(vq))
2116585ffb7SSasha Levin 			ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, id);
2124f56d42cSAsias He 	}
2134f56d42cSAsias He 
2146d6cc14bSWill Deacon out_err:
215c4aa7c02SPekka Enberg 	pthread_exit(NULL);
216c4aa7c02SPekka Enberg 	return NULL;
217c4aa7c02SPekka Enberg }
218407475bfSPekka Enberg 
2196585ffb7SSasha Levin static virtio_net_ctrl_ack virtio_net_handle_mq(struct kvm* kvm, struct net_dev *ndev, struct virtio_net_ctrl_hdr *ctrl)
2206585ffb7SSasha Levin {
2216585ffb7SSasha Levin 	/* Not much to do here */
2226585ffb7SSasha Levin 	return VIRTIO_NET_OK;
2236585ffb7SSasha Levin }
2246585ffb7SSasha Levin 
2256585ffb7SSasha Levin static void *virtio_net_ctrl_thread(void *p)
226abd4a801SSasha Levin {
227abd4a801SSasha Levin 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
228abd4a801SSasha Levin 	u16 out, in, head;
2296585ffb7SSasha Levin 	struct net_dev *ndev = p;
2306585ffb7SSasha Levin 	struct kvm *kvm = ndev->kvm;
23179052597SSasha Levin 	u32 id = ndev->queue_pairs * 2;
2326585ffb7SSasha Levin 	struct virt_queue *vq = &ndev->vqs[id];
233abd4a801SSasha Levin 	struct virtio_net_ctrl_hdr *ctrl;
234abd4a801SSasha Levin 	virtio_net_ctrl_ack *ack;
235abd4a801SSasha Levin 
2366585ffb7SSasha Levin 	while (1) {
2376585ffb7SSasha Levin 		mutex_lock(&ndev->io_lock[id]);
2386585ffb7SSasha Levin 		if (!virt_queue__available(vq))
2396585ffb7SSasha Levin 			pthread_cond_wait(&ndev->io_cond[id], &ndev->io_lock[id].mutex);
2406585ffb7SSasha Levin 		mutex_unlock(&ndev->io_lock[id]);
2416585ffb7SSasha Levin 
2426585ffb7SSasha Levin 		while (virt_queue__available(vq)) {
2436585ffb7SSasha Levin 			head = virt_queue__get_iov(&ndev->vqs[id], iov, &out, &in, kvm);
244abd4a801SSasha Levin 			ctrl = iov[0].iov_base;
245abd4a801SSasha Levin 			ack = iov[out].iov_base;
246abd4a801SSasha Levin 
247abd4a801SSasha Levin 			switch (ctrl->class) {
2486585ffb7SSasha Levin 			case VIRTIO_NET_CTRL_MQ:
2496585ffb7SSasha Levin 				*ack = virtio_net_handle_mq(kvm, ndev, ctrl);
2506585ffb7SSasha Levin 				break;
251abd4a801SSasha Levin 			default:
252abd4a801SSasha Levin 				*ack = VIRTIO_NET_ERR;
253abd4a801SSasha Levin 				break;
254abd4a801SSasha Levin 			}
2556585ffb7SSasha Levin 			virt_queue__set_used_elem(&ndev->vqs[id], head, iov[out].iov_len);
2566585ffb7SSasha Levin 		}
257abd4a801SSasha Levin 
2586585ffb7SSasha Levin 		if (virtio_queue__should_signal(&ndev->vqs[id]))
2596585ffb7SSasha Levin 			ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, id);
2606585ffb7SSasha Levin 	}
261abd4a801SSasha Levin 
2626585ffb7SSasha Levin 	pthread_exit(NULL);
263abd4a801SSasha Levin 
2646585ffb7SSasha Levin 	return NULL;
265abd4a801SSasha Levin }
266abd4a801SSasha Levin 
2679a6d73f1SSasha Levin static void virtio_net_handle_callback(struct kvm *kvm, struct net_dev *ndev, int queue)
2684f56d42cSAsias He {
26979052597SSasha Levin 	if ((u32)queue >= (ndev->queue_pairs * 2 + 1)) {
2709a6d73f1SSasha Levin 		pr_warning("Unknown queue index %u", queue);
2716585ffb7SSasha Levin 		return;
272c4aa7c02SPekka Enberg 	}
2736585ffb7SSasha Levin 
2746585ffb7SSasha Levin 	mutex_lock(&ndev->io_lock[queue]);
2756585ffb7SSasha Levin 	pthread_cond_signal(&ndev->io_cond[queue]);
2766585ffb7SSasha Levin 	mutex_unlock(&ndev->io_lock[queue]);
2774f56d42cSAsias He }
2784f56d42cSAsias He 
2798c0ae74dSSasha Levin static bool virtio_net__tap_init(struct net_dev *ndev)
2804f56d42cSAsias He {
281cb7202c1SSasha Levin 	int sock = socket(AF_INET, SOCK_STREAM, 0);
282f715177dSAsias He 	int pid, status, offload, hdr_len;
283cb7202c1SSasha Levin 	struct sockaddr_in sin = {0};
284246c8347SAsias He 	struct ifreq ifr;
2858c0ae74dSSasha Levin 	const struct virtio_net_params *params = ndev->params;
2861dfc7c24SMarc Zyngier 	bool skipconf = !!params->tapif;
2874f56d42cSAsias He 
288f19edd1eSSasha Levin 	/* Did the user already gave us the FD? */
289f19edd1eSSasha Levin 	if (params->fd) {
290f19edd1eSSasha Levin 		ndev->tap_fd = params->fd;
291f19edd1eSSasha Levin 		return 1;
292f19edd1eSSasha Levin 	}
293f19edd1eSSasha Levin 
2949a6d73f1SSasha Levin 	ndev->tap_fd = open("/dev/net/tun", O_RDWR);
2959a6d73f1SSasha Levin 	if (ndev->tap_fd < 0) {
2964542f276SCyrill Gorcunov 		pr_warning("Unable to open /dev/net/tun");
2973b02f580SSasha Levin 		goto fail;
2983b02f580SSasha Levin 	}
2994f56d42cSAsias He 
3004f56d42cSAsias He 	memset(&ifr, 0, sizeof(ifr));
301246c8347SAsias He 	ifr.ifr_flags = IFF_TAP | IFF_NO_PI | IFF_VNET_HDR;
3021dfc7c24SMarc Zyngier 	if (params->tapif)
3031dfc7c24SMarc Zyngier 		strncpy(ifr.ifr_name, params->tapif, sizeof(ifr.ifr_name));
3049a6d73f1SSasha Levin 	if (ioctl(ndev->tap_fd, TUNSETIFF, &ifr) < 0) {
3054542f276SCyrill Gorcunov 		pr_warning("Config tap device error. Are you root?");
3063b02f580SSasha Levin 		goto fail;
3073b02f580SSasha Levin 	}
3084f56d42cSAsias He 
3099a6d73f1SSasha Levin 	strncpy(ndev->tap_name, ifr.ifr_name, sizeof(ndev->tap_name));
3104f56d42cSAsias He 
3119a6d73f1SSasha Levin 	if (ioctl(ndev->tap_fd, TUNSETNOCSUM, 1) < 0) {
3124542f276SCyrill Gorcunov 		pr_warning("Config tap device TUNSETNOCSUM error");
313246c8347SAsias He 		goto fail;
314246c8347SAsias He 	}
315246c8347SAsias He 
3167668c3a6SSasha Levin 	hdr_len = has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ?
31748c6b47aSSasha Levin 			sizeof(struct virtio_net_hdr_mrg_rxbuf) :
31848c6b47aSSasha Levin 			sizeof(struct virtio_net_hdr);
3199a6d73f1SSasha Levin 	if (ioctl(ndev->tap_fd, TUNSETVNETHDRSZ, &hdr_len) < 0)
3204542f276SCyrill Gorcunov 		pr_warning("Config tap device TUNSETVNETHDRSZ error");
321246c8347SAsias He 
322246c8347SAsias He 	offload = TUN_F_CSUM | TUN_F_TSO4 | TUN_F_TSO6 | TUN_F_UFO;
3239a6d73f1SSasha Levin 	if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) {
3244542f276SCyrill Gorcunov 		pr_warning("Config tap device TUNSETOFFLOAD error");
325246c8347SAsias He 		goto fail;
326246c8347SAsias He 	}
3274f56d42cSAsias He 
32873b7d038SAmos Kong 	if (strcmp(params->script, "none")) {
32973b7d038SAmos Kong 		pid = fork();
33073b7d038SAmos Kong 		if (pid == 0) {
3319a6d73f1SSasha Levin 			execl(params->script, params->script, ndev->tap_name, NULL);
33273b7d038SAmos Kong 			_exit(1);
33373b7d038SAmos Kong 		} else {
33473b7d038SAmos Kong 			waitpid(pid, &status, 0);
33573b7d038SAmos Kong 			if (WIFEXITED(status) && WEXITSTATUS(status) != 0) {
3364542f276SCyrill Gorcunov 				pr_warning("Fail to setup tap by %s", params->script);
33773b7d038SAmos Kong 				goto fail;
33873b7d038SAmos Kong 			}
33973b7d038SAmos Kong 		}
3401dfc7c24SMarc Zyngier 	} else if (!skipconf) {
341cb7202c1SSasha Levin 		memset(&ifr, 0, sizeof(ifr));
3429a6d73f1SSasha Levin 		strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ndev->tap_name));
343bdfcfca6SSasha Levin 		sin.sin_addr.s_addr = inet_addr(params->host_ip);
344cb7202c1SSasha Levin 		memcpy(&(ifr.ifr_addr), &sin, sizeof(ifr.ifr_addr));
345cb7202c1SSasha Levin 		ifr.ifr_addr.sa_family = AF_INET;
3463b02f580SSasha Levin 		if (ioctl(sock, SIOCSIFADDR, &ifr) < 0) {
3474542f276SCyrill Gorcunov 			pr_warning("Could not set ip address on tap device");
3483b02f580SSasha Levin 			goto fail;
3493b02f580SSasha Levin 		}
35073b7d038SAmos Kong 	}
351cb7202c1SSasha Levin 
3521dfc7c24SMarc Zyngier 	if (!skipconf) {
353cb7202c1SSasha Levin 		memset(&ifr, 0, sizeof(ifr));
3549a6d73f1SSasha Levin 		strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ndev->tap_name));
355cb7202c1SSasha Levin 		ioctl(sock, SIOCGIFFLAGS, &ifr);
356cb7202c1SSasha Levin 		ifr.ifr_flags |= IFF_UP | IFF_RUNNING;
357cb7202c1SSasha Levin 		if (ioctl(sock, SIOCSIFFLAGS, &ifr) < 0)
3584542f276SCyrill Gorcunov 			pr_warning("Could not bring tap device up");
3591dfc7c24SMarc Zyngier 	}
360cb7202c1SSasha Levin 
361cb7202c1SSasha Levin 	close(sock);
3623b02f580SSasha Levin 
3633b02f580SSasha Levin 	return 1;
3643b02f580SSasha Levin 
3653b02f580SSasha Levin fail:
3663b02f580SSasha Levin 	if (sock >= 0)
3673b02f580SSasha Levin 		close(sock);
3689a6d73f1SSasha Levin 	if (ndev->tap_fd >= 0)
3699a6d73f1SSasha Levin 		close(ndev->tap_fd);
3703b02f580SSasha Levin 
3713b02f580SSasha Levin 	return 0;
3724f56d42cSAsias He }
3734f56d42cSAsias He 
374b4fdde6dSAsias He static inline int tap_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev)
375b4fdde6dSAsias He {
376b4fdde6dSAsias He 	return writev(ndev->tap_fd, iov, out);
377b4fdde6dSAsias He }
378b4fdde6dSAsias He 
379b4fdde6dSAsias He static inline int tap_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev)
380b4fdde6dSAsias He {
381b4fdde6dSAsias He 	return readv(ndev->tap_fd, iov, in);
382b4fdde6dSAsias He }
383b4fdde6dSAsias He 
384b4fdde6dSAsias He static inline int uip_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev)
385b4fdde6dSAsias He {
386b4fdde6dSAsias He 	return uip_tx(iov, out, &ndev->info);
387b4fdde6dSAsias He }
388b4fdde6dSAsias He 
389b4fdde6dSAsias He static inline int uip_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev)
390b4fdde6dSAsias He {
391b4fdde6dSAsias He 	return uip_rx(iov, in, &ndev->info);
392b4fdde6dSAsias He }
393b4fdde6dSAsias He 
394b4fdde6dSAsias He static struct net_dev_operations tap_ops = {
395b4fdde6dSAsias He 	.rx	= tap_ops_rx,
396b4fdde6dSAsias He 	.tx	= tap_ops_tx,
397b4fdde6dSAsias He };
398b4fdde6dSAsias He 
399b4fdde6dSAsias He static struct net_dev_operations uip_ops = {
400b4fdde6dSAsias He 	.rx	= uip_ops_rx,
401b4fdde6dSAsias He 	.tx	= uip_ops_tx,
402b4fdde6dSAsias He };
403b4fdde6dSAsias He 
404c5ae742bSSasha Levin static u8 *get_config(struct kvm *kvm, void *dev)
40578a2a3e2SSasha Levin {
40678a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
40778a2a3e2SSasha Levin 
408c5ae742bSSasha Levin 	return ((u8 *)(&ndev->config));
40978a2a3e2SSasha Levin }
41078a2a3e2SSasha Levin 
41178a2a3e2SSasha Levin static u32 get_host_features(struct kvm *kvm, void *dev)
41278a2a3e2SSasha Levin {
41379052597SSasha Levin 	struct net_dev *ndev = dev;
41479052597SSasha Levin 
41578a2a3e2SSasha Levin 	return 1UL << VIRTIO_NET_F_MAC
41678a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_CSUM
41778a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_HOST_UFO
41878a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_HOST_TSO4
41978a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_HOST_TSO6
42078a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_GUEST_UFO
42178a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_GUEST_TSO4
42292c1f37bSSasha Levin 		| 1UL << VIRTIO_NET_F_GUEST_TSO6
423754c8ce3SSasha Levin 		| 1UL << VIRTIO_RING_F_EVENT_IDX
424abd4a801SSasha Levin 		| 1UL << VIRTIO_RING_F_INDIRECT_DESC
4256585ffb7SSasha Levin 		| 1UL << VIRTIO_NET_F_CTRL_VQ
4267668c3a6SSasha Levin 		| 1UL << VIRTIO_NET_F_MRG_RXBUF
42779052597SSasha Levin 		| 1UL << (ndev->queue_pairs > 1 ? VIRTIO_NET_F_MQ : 0);
42878a2a3e2SSasha Levin }
42978a2a3e2SSasha Levin 
43015636d5eSYing-Shiuan Pan static int virtio_net__vhost_set_features(struct net_dev *ndev)
43115636d5eSYing-Shiuan Pan {
43215636d5eSYing-Shiuan Pan 	u64 features = 1UL << VIRTIO_RING_F_EVENT_IDX;
43315636d5eSYing-Shiuan Pan 	u64 vhost_features;
43415636d5eSYing-Shiuan Pan 
43515636d5eSYing-Shiuan Pan 	if (ioctl(ndev->vhost_fd, VHOST_GET_FEATURES, &vhost_features) != 0)
43615636d5eSYing-Shiuan Pan 		die_perror("VHOST_GET_FEATURES failed");
43715636d5eSYing-Shiuan Pan 
43815636d5eSYing-Shiuan Pan 	/* make sure both side support mergable rx buffers */
43915636d5eSYing-Shiuan Pan 	if (vhost_features & 1UL << VIRTIO_NET_F_MRG_RXBUF &&
44015636d5eSYing-Shiuan Pan 			has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF))
44115636d5eSYing-Shiuan Pan 		features |= 1UL << VIRTIO_NET_F_MRG_RXBUF;
44215636d5eSYing-Shiuan Pan 
44315636d5eSYing-Shiuan Pan 	return ioctl(ndev->vhost_fd, VHOST_SET_FEATURES, &features);
44415636d5eSYing-Shiuan Pan }
44515636d5eSYing-Shiuan Pan 
44678a2a3e2SSasha Levin static void set_guest_features(struct kvm *kvm, void *dev, u32 features)
44778a2a3e2SSasha Levin {
44878a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
449*8ed60bbeSMarc Zyngier 	struct virtio_net_config *conf = &ndev->config;
45078a2a3e2SSasha Levin 
45178a2a3e2SSasha Levin 	ndev->features = features;
4528aa155c4SYing-Shiuan Pan 
453*8ed60bbeSMarc Zyngier 	conf->status = virtio_host_to_guest_u16(&ndev->vdev, conf->status);
454*8ed60bbeSMarc Zyngier 	conf->max_virtqueue_pairs = virtio_host_to_guest_u16(&ndev->vdev,
455*8ed60bbeSMarc Zyngier 							     conf->max_virtqueue_pairs);
456*8ed60bbeSMarc Zyngier 
4578aa155c4SYing-Shiuan Pan 	if (ndev->mode == NET_MODE_TAP) {
4588aa155c4SYing-Shiuan Pan 		if (!virtio_net__tap_init(ndev))
4598aa155c4SYing-Shiuan Pan 			die_perror("You have requested a TAP device, but creation of one has failed because");
46015636d5eSYing-Shiuan Pan 		if (ndev->vhost_fd &&
46115636d5eSYing-Shiuan Pan 				virtio_net__vhost_set_features(ndev) != 0)
46215636d5eSYing-Shiuan Pan 			die_perror("VHOST_SET_FEATURES failed");
4638aa155c4SYing-Shiuan Pan 	} else {
4648aa155c4SYing-Shiuan Pan 		ndev->info.vnet_hdr_len = has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ?
4658aa155c4SYing-Shiuan Pan 						sizeof(struct virtio_net_hdr_mrg_rxbuf) :
4668aa155c4SYing-Shiuan Pan 						sizeof(struct virtio_net_hdr);
4678aa155c4SYing-Shiuan Pan 		uip_init(&ndev->info);
4688aa155c4SYing-Shiuan Pan 	}
46978a2a3e2SSasha Levin }
47078a2a3e2SSasha Levin 
4719e56ec14SSasha Levin static bool is_ctrl_vq(struct net_dev *ndev, u32 vq)
4729e56ec14SSasha Levin {
4739e56ec14SSasha Levin 	return vq == (u32)(ndev->queue_pairs * 2);
4749e56ec14SSasha Levin }
4759e56ec14SSasha Levin 
476c59ba304SWill Deacon static int init_vq(struct kvm *kvm, void *dev, u32 vq, u32 page_size, u32 align,
477c59ba304SWill Deacon 		   u32 pfn)
47878a2a3e2SSasha Levin {
4799ed67cdcSSasha Levin 	struct vhost_vring_state state = { .index = vq };
4809ed67cdcSSasha Levin 	struct vhost_vring_addr addr;
48178a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
48278a2a3e2SSasha Levin 	struct virt_queue *queue;
48378a2a3e2SSasha Levin 	void *p;
4849ed67cdcSSasha Levin 	int r;
48578a2a3e2SSasha Levin 
486312c62d1SSasha Levin 	compat__remove_message(compat_id);
48778a2a3e2SSasha Levin 
48878a2a3e2SSasha Levin 	queue		= &ndev->vqs[vq];
48978a2a3e2SSasha Levin 	queue->pfn	= pfn;
490e7e2950aSSasha Levin 	p		= virtio_get_vq(kvm, queue->pfn, page_size);
49178a2a3e2SSasha Levin 
492c59ba304SWill Deacon 	vring_init(&queue->vring, VIRTIO_NET_QUEUE_SIZE, p, align);
493*8ed60bbeSMarc Zyngier 	virtio_init_device_vq(&ndev->vdev, queue);
49478a2a3e2SSasha Levin 
4956585ffb7SSasha Levin 	mutex_init(&ndev->io_lock[vq]);
4966585ffb7SSasha Levin 	pthread_cond_init(&ndev->io_cond[vq], NULL);
4979e56ec14SSasha Levin 	if (is_ctrl_vq(ndev, vq)) {
4986585ffb7SSasha Levin 		pthread_create(&ndev->io_thread[vq], NULL, virtio_net_ctrl_thread, ndev);
4999e56ec14SSasha Levin 
5009e56ec14SSasha Levin 		return 0;
5019e56ec14SSasha Levin 	} else if (ndev->vhost_fd == 0 ) {
5029e56ec14SSasha Levin 		if (vq & 1)
5036585ffb7SSasha Levin 			pthread_create(&ndev->io_thread[vq], NULL, virtio_net_tx_thread, ndev);
5046585ffb7SSasha Levin 		else
5056585ffb7SSasha Levin 			pthread_create(&ndev->io_thread[vq], NULL, virtio_net_rx_thread, ndev);
5066585ffb7SSasha Levin 
50778a2a3e2SSasha Levin 		return 0;
5086585ffb7SSasha Levin 	}
5099ed67cdcSSasha Levin 
510*8ed60bbeSMarc Zyngier 	if (queue->endian != VIRTIO_ENDIAN_HOST)
511*8ed60bbeSMarc Zyngier 		die_perror("VHOST requires VIRTIO_ENDIAN_HOST");
512*8ed60bbeSMarc Zyngier 
5139ed67cdcSSasha Levin 	state.num = queue->vring.num;
5149ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_NUM, &state);
5159ed67cdcSSasha Levin 	if (r < 0)
5169ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_NUM failed");
5179ed67cdcSSasha Levin 	state.num = 0;
5189ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_BASE, &state);
5199ed67cdcSSasha Levin 	if (r < 0)
5209ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_BASE failed");
5219ed67cdcSSasha Levin 
5229ed67cdcSSasha Levin 	addr = (struct vhost_vring_addr) {
5239ed67cdcSSasha Levin 		.index = vq,
5249ed67cdcSSasha Levin 		.desc_user_addr = (u64)(unsigned long)queue->vring.desc,
5259ed67cdcSSasha Levin 		.avail_user_addr = (u64)(unsigned long)queue->vring.avail,
5269ed67cdcSSasha Levin 		.used_user_addr = (u64)(unsigned long)queue->vring.used,
5279ed67cdcSSasha Levin 	};
5289ed67cdcSSasha Levin 
5299ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_ADDR, &addr);
5309ed67cdcSSasha Levin 	if (r < 0)
5319ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_ADDR failed");
5329ed67cdcSSasha Levin 
5339ed67cdcSSasha Levin 	return 0;
5349ed67cdcSSasha Levin }
5359ed67cdcSSasha Levin 
5369ed67cdcSSasha Levin static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi)
5379ed67cdcSSasha Levin {
5389ed67cdcSSasha Levin 	struct net_dev *ndev = dev;
5399ed67cdcSSasha Levin 	struct kvm_irqfd irq;
5409ed67cdcSSasha Levin 	struct vhost_vring_file file;
5419ed67cdcSSasha Levin 	int r;
5429ed67cdcSSasha Levin 
5439ed67cdcSSasha Levin 	if (ndev->vhost_fd == 0)
5449ed67cdcSSasha Levin 		return;
5459ed67cdcSSasha Levin 
5469ed67cdcSSasha Levin 	irq = (struct kvm_irqfd) {
5479ed67cdcSSasha Levin 		.gsi	= gsi,
5489ed67cdcSSasha Levin 		.fd	= eventfd(0, 0),
5499ed67cdcSSasha Levin 	};
5509ed67cdcSSasha Levin 	file = (struct vhost_vring_file) {
5519ed67cdcSSasha Levin 		.index	= vq,
5529ed67cdcSSasha Levin 		.fd	= irq.fd,
5539ed67cdcSSasha Levin 	};
5549ed67cdcSSasha Levin 
5559ed67cdcSSasha Levin 	r = ioctl(kvm->vm_fd, KVM_IRQFD, &irq);
5569ed67cdcSSasha Levin 	if (r < 0)
5579ed67cdcSSasha Levin 		die_perror("KVM_IRQFD failed");
5589ed67cdcSSasha Levin 
5599ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_CALL, &file);
5609ed67cdcSSasha Levin 	if (r < 0)
5619ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_CALL failed");
5629ed67cdcSSasha Levin 	file.fd = ndev->tap_fd;
5639ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_NET_SET_BACKEND, &file);
5649ed67cdcSSasha Levin 	if (r != 0)
5659ed67cdcSSasha Levin 		die("VHOST_NET_SET_BACKEND failed %d", errno);
5669ed67cdcSSasha Levin 
5679ed67cdcSSasha Levin }
5689ed67cdcSSasha Levin 
5699ed67cdcSSasha Levin static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd)
5709ed67cdcSSasha Levin {
5719ed67cdcSSasha Levin 	struct net_dev *ndev = dev;
5729ed67cdcSSasha Levin 	struct vhost_vring_file file = {
5739ed67cdcSSasha Levin 		.index	= vq,
5749ed67cdcSSasha Levin 		.fd	= efd,
5759ed67cdcSSasha Levin 	};
5769ed67cdcSSasha Levin 	int r;
5779ed67cdcSSasha Levin 
5789e56ec14SSasha Levin 	if (ndev->vhost_fd == 0 || is_ctrl_vq(ndev, vq))
5799ed67cdcSSasha Levin 		return;
5809ed67cdcSSasha Levin 
5819ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_KICK, &file);
5829ed67cdcSSasha Levin 	if (r < 0)
5839ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_KICK failed");
58478a2a3e2SSasha Levin }
58578a2a3e2SSasha Levin 
58678a2a3e2SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq)
58778a2a3e2SSasha Levin {
5889a6d73f1SSasha Levin 	struct net_dev *ndev = dev;
5899a6d73f1SSasha Levin 
5909a6d73f1SSasha Levin 	virtio_net_handle_callback(kvm, ndev, vq);
59178a2a3e2SSasha Levin 
59278a2a3e2SSasha Levin 	return 0;
59378a2a3e2SSasha Levin }
59478a2a3e2SSasha Levin 
59578a2a3e2SSasha Levin static int get_pfn_vq(struct kvm *kvm, void *dev, u32 vq)
59678a2a3e2SSasha Levin {
59778a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
59878a2a3e2SSasha Levin 
59978a2a3e2SSasha Levin 	return ndev->vqs[vq].pfn;
60078a2a3e2SSasha Levin }
60178a2a3e2SSasha Levin 
60278a2a3e2SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq)
60378a2a3e2SSasha Levin {
6040f4f51a8SAsias He 	/* FIXME: dynamic */
60578a2a3e2SSasha Levin 	return VIRTIO_NET_QUEUE_SIZE;
60678a2a3e2SSasha Levin }
60778a2a3e2SSasha Levin 
6080f4f51a8SAsias He static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size)
6090f4f51a8SAsias He {
6100f4f51a8SAsias He 	/* FIXME: dynamic */
6110f4f51a8SAsias He 	return size;
6120f4f51a8SAsias He }
6130f4f51a8SAsias He 
6141c47ce69SSasha Levin static struct virtio_ops net_dev_virtio_ops = (struct virtio_ops) {
6151c47ce69SSasha Levin 	.get_config		= get_config,
6161c47ce69SSasha Levin 	.get_host_features	= get_host_features,
6171c47ce69SSasha Levin 	.set_guest_features	= set_guest_features,
6181c47ce69SSasha Levin 	.init_vq		= init_vq,
6191c47ce69SSasha Levin 	.get_pfn_vq		= get_pfn_vq,
6201c47ce69SSasha Levin 	.get_size_vq		= get_size_vq,
6210f4f51a8SAsias He 	.set_size_vq		= set_size_vq,
6220f4f51a8SAsias He 	.notify_vq		= notify_vq,
6239ed67cdcSSasha Levin 	.notify_vq_gsi		= notify_vq_gsi,
6249ed67cdcSSasha Levin 	.notify_vq_eventfd	= notify_vq_eventfd,
6251c47ce69SSasha Levin };
6261c47ce69SSasha Levin 
6279ed67cdcSSasha Levin static void virtio_net__vhost_init(struct kvm *kvm, struct net_dev *ndev)
6289ed67cdcSSasha Levin {
6299ed67cdcSSasha Levin 	struct vhost_memory *mem;
6309ed67cdcSSasha Levin 	int r;
6319ed67cdcSSasha Levin 
6329ed67cdcSSasha Levin 	ndev->vhost_fd = open("/dev/vhost-net", O_RDWR);
6339ed67cdcSSasha Levin 	if (ndev->vhost_fd < 0)
6349ed67cdcSSasha Levin 		die_perror("Failed openning vhost-net device");
6359ed67cdcSSasha Levin 
6368b795457SAsias He 	mem = calloc(1, sizeof(*mem) + sizeof(struct vhost_memory_region));
6379ed67cdcSSasha Levin 	if (mem == NULL)
6389ed67cdcSSasha Levin 		die("Failed allocating memory for vhost memory map");
6399ed67cdcSSasha Levin 
6409ed67cdcSSasha Levin 	mem->nregions = 1;
6419ed67cdcSSasha Levin 	mem->regions[0] = (struct vhost_memory_region) {
6429ed67cdcSSasha Levin 		.guest_phys_addr	= 0,
6439ed67cdcSSasha Levin 		.memory_size		= kvm->ram_size,
644b4108023SAsias He 		.userspace_addr		= (unsigned long)kvm->ram_start,
6459ed67cdcSSasha Levin 	};
6469ed67cdcSSasha Levin 
6479ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_OWNER);
6489ed67cdcSSasha Levin 	if (r != 0)
6499ed67cdcSSasha Levin 		die_perror("VHOST_SET_OWNER failed");
6509ed67cdcSSasha Levin 
6519ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_MEM_TABLE, mem);
6529ed67cdcSSasha Levin 	if (r != 0)
6539ed67cdcSSasha Levin 		die_perror("VHOST_SET_MEM_TABLE failed");
654627d6874SAsias He 
655627d6874SAsias He 	ndev->vdev.use_vhost = true;
656627d6874SAsias He 
6579ed67cdcSSasha Levin 	free(mem);
6589ed67cdcSSasha Levin }
6599ed67cdcSSasha Levin 
/*
 * Parse a colon-separated hexadecimal MAC address ("aa:bb:cc:dd:ee:ff")
 * from @str into the six bytes starting at @mac.
 *
 * Bytes are filled left to right. If @str is malformed, conversion stops at
 * the first field that does not match and the remaining bytes of @mac keep
 * their previous values. A NULL @str or @mac leaves @mac untouched.
 */
static inline void str_to_mac(const char *str, char *mac)
{
	/* %hhx stores through an unsigned char pointer, not plain char. */
	unsigned char *octet = (unsigned char *)mac;

	if (str == NULL || mac == NULL)
		return;

	sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
	       &octet[0], &octet[1], &octet[2],
	       &octet[3], &octet[4], &octet[5]);
}
6654346fd8fSSasha Levin static int set_net_param(struct kvm *kvm, struct virtio_net_params *p,
6664346fd8fSSasha Levin 			const char *param, const char *val)
6675f225124SSasha Levin {
6685f225124SSasha Levin 	if (strcmp(param, "guest_mac") == 0) {
6695f225124SSasha Levin 		str_to_mac(val, p->guest_mac);
6705f225124SSasha Levin 	} else if (strcmp(param, "mode") == 0) {
6715f225124SSasha Levin 		if (!strncmp(val, "user", 4)) {
6725f225124SSasha Levin 			int i;
6735f225124SSasha Levin 
6745f225124SSasha Levin 			for (i = 0; i < kvm->cfg.num_net_devices; i++)
6755f225124SSasha Levin 				if (kvm->cfg.net_params[i].mode == NET_MODE_USER)
6765f225124SSasha Levin 					die("Only one usermode network device allowed at a time");
6775f225124SSasha Levin 			p->mode = NET_MODE_USER;
6785f225124SSasha Levin 		} else if (!strncmp(val, "tap", 3)) {
6795f225124SSasha Levin 			p->mode = NET_MODE_TAP;
6805f225124SSasha Levin 		} else if (!strncmp(val, "none", 4)) {
6815f225124SSasha Levin 			kvm->cfg.no_net = 1;
6825f225124SSasha Levin 			return -1;
6835f225124SSasha Levin 		} else
6845f225124SSasha Levin 			die("Unknown network mode %s, please use user, tap or none", kvm->cfg.network);
6855f225124SSasha Levin 	} else if (strcmp(param, "script") == 0) {
6865f225124SSasha Levin 		p->script = strdup(val);
6875f225124SSasha Levin 	} else if (strcmp(param, "guest_ip") == 0) {
6885f225124SSasha Levin 		p->guest_ip = strdup(val);
6895f225124SSasha Levin 	} else if (strcmp(param, "host_ip") == 0) {
6905f225124SSasha Levin 		p->host_ip = strdup(val);
6915f225124SSasha Levin 	} else if (strcmp(param, "trans") == 0) {
6925f225124SSasha Levin 		p->trans = strdup(val);
6931dfc7c24SMarc Zyngier 	} else if (strcmp(param, "tapif") == 0) {
6941dfc7c24SMarc Zyngier 		p->tapif = strdup(val);
6955f225124SSasha Levin 	} else if (strcmp(param, "vhost") == 0) {
6965f225124SSasha Levin 		p->vhost = atoi(val);
6975f225124SSasha Levin 	} else if (strcmp(param, "fd") == 0) {
6985f225124SSasha Levin 		p->fd = atoi(val);
69979052597SSasha Levin 	} else if (strcmp(param, "mq") == 0) {
70079052597SSasha Levin 		p->mq = atoi(val);
7015f225124SSasha Levin 	} else
7025f225124SSasha Levin 		die("Unknown network parameter %s", param);
7035f225124SSasha Levin 
7045f225124SSasha Levin 	return 0;
7055f225124SSasha Levin }
7065f225124SSasha Levin 
7075f225124SSasha Levin int netdev_parser(const struct option *opt, const char *arg, int unset)
7085f225124SSasha Levin {
7095f225124SSasha Levin 	struct virtio_net_params p;
7105f225124SSasha Levin 	char *buf = NULL, *cmd = NULL, *cur = NULL;
7115f225124SSasha Levin 	bool on_cmd = true;
7125f225124SSasha Levin 	struct kvm *kvm = opt->ptr;
7135f225124SSasha Levin 
7145f225124SSasha Levin 	if (arg) {
7155f225124SSasha Levin 		buf = strdup(arg);
7165f225124SSasha Levin 		if (buf == NULL)
7175f225124SSasha Levin 			die("Failed allocating new net buffer");
7185f225124SSasha Levin 		cur = strtok(buf, ",=");
7195f225124SSasha Levin 	}
7205f225124SSasha Levin 
7215f225124SSasha Levin 	p = (struct virtio_net_params) {
7225f225124SSasha Levin 		.guest_ip	= DEFAULT_GUEST_ADDR,
7235f225124SSasha Levin 		.host_ip	= DEFAULT_HOST_ADDR,
7245f225124SSasha Levin 		.script		= DEFAULT_SCRIPT,
7255f225124SSasha Levin 		.mode		= NET_MODE_TAP,
7265f225124SSasha Levin 	};
7275f225124SSasha Levin 
7285f225124SSasha Levin 	str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac);
7295f225124SSasha Levin 	p.guest_mac[5] += kvm->cfg.num_net_devices;
7305f225124SSasha Levin 
7315f225124SSasha Levin 	while (cur) {
7325f225124SSasha Levin 		if (on_cmd) {
7335f225124SSasha Levin 			cmd = cur;
7345f225124SSasha Levin 		} else {
7354346fd8fSSasha Levin 			if (set_net_param(kvm, &p, cmd, cur) < 0)
7365f225124SSasha Levin 				goto done;
7375f225124SSasha Levin 		}
7385f225124SSasha Levin 		on_cmd = !on_cmd;
7395f225124SSasha Levin 
7405f225124SSasha Levin 		cur = strtok(NULL, ",=");
7415f225124SSasha Levin 	};
7425f225124SSasha Levin 
7435f225124SSasha Levin 	kvm->cfg.num_net_devices++;
7445f225124SSasha Levin 
7455f225124SSasha Levin 	kvm->cfg.net_params = realloc(kvm->cfg.net_params, kvm->cfg.num_net_devices * sizeof(*kvm->cfg.net_params));
7465f225124SSasha Levin 	if (kvm->cfg.net_params == NULL)
7475f225124SSasha Levin 		die("Failed adding new network device");
7485f225124SSasha Levin 
7495f225124SSasha Levin 	kvm->cfg.net_params[kvm->cfg.num_net_devices - 1] = p;
7505f225124SSasha Levin 
7515f225124SSasha Levin done:
7525f225124SSasha Levin 	free(buf);
7535f225124SSasha Levin 	return 0;
7545f225124SSasha Levin }
7555f225124SSasha Levin 
7565f225124SSasha Levin static int virtio_net__init_one(struct virtio_net_params *params)
7574f56d42cSAsias He {
75876a4aac6SWill Deacon 	int i, err;
7599a6d73f1SSasha Levin 	struct net_dev *ndev;
76076a4aac6SWill Deacon 	struct virtio_ops *ops;
7619a6d73f1SSasha Levin 
7629a6d73f1SSasha Levin 	ndev = calloc(1, sizeof(struct net_dev));
7639a6d73f1SSasha Levin 	if (ndev == NULL)
7645f225124SSasha Levin 		return -ENOMEM;
7659a6d73f1SSasha Levin 
76676a4aac6SWill Deacon 	ops = malloc(sizeof(*ops));
76776a4aac6SWill Deacon 	if (ops == NULL) {
76876a4aac6SWill Deacon 		err = -ENOMEM;
76976a4aac6SWill Deacon 		goto err_free_ndev;
77076a4aac6SWill Deacon 	}
77176a4aac6SWill Deacon 
7729a6d73f1SSasha Levin 	list_add_tail(&ndev->list, &ndevs);
7739a6d73f1SSasha Levin 
7749a6d73f1SSasha Levin 	ndev->kvm = params->kvm;
7758c0ae74dSSasha Levin 	ndev->params = params;
7769a6d73f1SSasha Levin 
7779a6d73f1SSasha Levin 	mutex_init(&ndev->mutex);
77879052597SSasha Levin 	ndev->queue_pairs = max(1, min(VIRTIO_NET_NUM_QUEUES, params->mq));
7799a6d73f1SSasha Levin 	ndev->config.status = VIRTIO_NET_S_LINK_UP;
78079052597SSasha Levin 	if (ndev->queue_pairs > 1)
78179052597SSasha Levin 		ndev->config.max_virtqueue_pairs = ndev->queue_pairs;
78279052597SSasha Levin 
7830c54698eSAsias He 	for (i = 0 ; i < 6 ; i++) {
7849a6d73f1SSasha Levin 		ndev->config.mac[i]		= params->guest_mac[i];
7859a6d73f1SSasha Levin 		ndev->info.guest_mac.addr[i]	= params->guest_mac[i];
7869a6d73f1SSasha Levin 		ndev->info.host_mac.addr[i]	= params->host_mac[i];
7870c54698eSAsias He 	}
788f715177dSAsias He 
7899a6d73f1SSasha Levin 	ndev->mode = params->mode;
7909a6d73f1SSasha Levin 	if (ndev->mode == NET_MODE_TAP) {
7919a6d73f1SSasha Levin 		ndev->ops = &tap_ops;
792b4fdde6dSAsias He 	} else {
7939a6d73f1SSasha Levin 		ndev->info.host_ip		= ntohl(inet_addr(params->host_ip));
7949a6d73f1SSasha Levin 		ndev->info.guest_ip		= ntohl(inet_addr(params->guest_ip));
7959a6d73f1SSasha Levin 		ndev->info.guest_netmask	= ntohl(inet_addr("255.255.255.0"));
7969a6d73f1SSasha Levin 		ndev->info.buf_nr		= 20,
7979a6d73f1SSasha Levin 		ndev->ops = &uip_ops;
7985f3aaf22SMarc Zyngier 		uip_static_init(&ndev->info);
799b4fdde6dSAsias He 	}
800b5ee1ea7SAsias He 
80176a4aac6SWill Deacon 	*ops = net_dev_virtio_ops;
80269205aa1SAsias He 	if (params->trans && strcmp(params->trans, "mmio") == 0)
80376a4aac6SWill Deacon 		virtio_init(params->kvm, ndev, &ndev->vdev, ops, VIRTIO_MMIO,
80476a4aac6SWill Deacon 			    PCI_DEVICE_ID_VIRTIO_NET, VIRTIO_ID_NET, PCI_CLASS_NET);
80569205aa1SAsias He 	else
80676a4aac6SWill Deacon 		virtio_init(params->kvm, ndev, &ndev->vdev, ops, VIRTIO_PCI,
80776a4aac6SWill Deacon 			    PCI_DEVICE_ID_VIRTIO_NET, VIRTIO_ID_NET, PCI_CLASS_NET);
80827ab67f5SSasha Levin 
8099ed67cdcSSasha Levin 	if (params->vhost)
8109ed67cdcSSasha Levin 		virtio_net__vhost_init(params->kvm, ndev);
811cb83de6fSSasha Levin 
812d278197dSAsias He 	if (compat_id == -1)
81352f34d2cSAsias He 		compat_id = virtio_compat_add_message("virtio-net", "CONFIG_VIRTIO_NET");
8145f225124SSasha Levin 
8155f225124SSasha Levin 	return 0;
81676a4aac6SWill Deacon 
81776a4aac6SWill Deacon err_free_ndev:
81876a4aac6SWill Deacon 	free(ndev);
81976a4aac6SWill Deacon 	return err;
8205f225124SSasha Levin }
8215f225124SSasha Levin 
8225f225124SSasha Levin int virtio_net__init(struct kvm *kvm)
8235f225124SSasha Levin {
8245f225124SSasha Levin 	int i;
8255f225124SSasha Levin 
8265f225124SSasha Levin 	for (i = 0; i < kvm->cfg.num_net_devices; i++) {
8275f225124SSasha Levin 		kvm->cfg.net_params[i].kvm = kvm;
8285f225124SSasha Levin 		virtio_net__init_one(&kvm->cfg.net_params[i]);
8295f225124SSasha Levin 	}
8305f225124SSasha Levin 
8315f225124SSasha Levin 	if (kvm->cfg.num_net_devices == 0 && kvm->cfg.no_net == 0) {
8328c0ae74dSSasha Levin 		static struct virtio_net_params net_params;
8335f225124SSasha Levin 
8345f225124SSasha Levin 		net_params = (struct virtio_net_params) {
8355f225124SSasha Levin 			.guest_ip	= kvm->cfg.guest_ip,
8365f225124SSasha Levin 			.host_ip	= kvm->cfg.host_ip,
8375f225124SSasha Levin 			.kvm		= kvm,
8385f225124SSasha Levin 			.script		= kvm->cfg.script,
8395f225124SSasha Levin 			.mode		= NET_MODE_USER,
8405f225124SSasha Levin 		};
8415f225124SSasha Levin 		str_to_mac(kvm->cfg.guest_mac, net_params.guest_mac);
8425f225124SSasha Levin 		str_to_mac(kvm->cfg.host_mac, net_params.host_mac);
8435f225124SSasha Levin 
8445f225124SSasha Levin 		virtio_net__init_one(&net_params);
8455f225124SSasha Levin 	}
8465f225124SSasha Levin 
8475f225124SSasha Levin 	return 0;
8485f225124SSasha Levin }
84949a8afd1SSasha Levin virtio_dev_init(virtio_net__init);
8505f225124SSasha Levin 
/*
 * Teardown hook for virtio-net, registered through virtio_dev_exit().
 * It performs no work and always reports success.
 */
int virtio_net__exit(struct kvm *kvm)
{
	const int status = 0;

	return status;
}
virtio_dev_exit(virtio_net__exit);
856