xref: /kvmtool/virtio/net.c (revision ad96e8676bfac56bcacaa3cb602e7107fb7a99fd)
131638bcaSCyrill Gorcunov #include "kvm/virtio-pci-dev.h"
2b5ee1ea7SAsias He #include "kvm/virtio-net.h"
34f56d42cSAsias He #include "kvm/virtio.h"
44f56d42cSAsias He #include "kvm/mutex.h"
54f56d42cSAsias He #include "kvm/util.h"
64f56d42cSAsias He #include "kvm/kvm.h"
72449f6e3SSasha Levin #include "kvm/irq.h"
8b5ee1ea7SAsias He #include "kvm/uip.h"
9cb83de6fSSasha Levin #include "kvm/guest_compat.h"
107668c3a6SSasha Levin #include "kvm/iovec.h"
114f56d42cSAsias He 
129ed67cdcSSasha Levin #include <linux/vhost.h>
134f56d42cSAsias He #include <linux/virtio_net.h>
144f56d42cSAsias He #include <linux/if_tun.h>
1578a2a3e2SSasha Levin #include <linux/types.h>
16c229370aSIngo Molnar 
17c229370aSIngo Molnar #include <arpa/inet.h>
184f56d42cSAsias He #include <net/if.h>
19c229370aSIngo Molnar 
20c229370aSIngo Molnar #include <unistd.h>
214f56d42cSAsias He #include <fcntl.h>
22c229370aSIngo Molnar 
23cb7202c1SSasha Levin #include <sys/socket.h>
24c229370aSIngo Molnar #include <sys/ioctl.h>
25c229370aSIngo Molnar #include <sys/types.h>
2673b7d038SAmos Kong #include <sys/wait.h>
279ed67cdcSSasha Levin #include <sys/eventfd.h>
284f56d42cSAsias He 
/* Ring size used for every virtqueue of the device (see init_vq/get_size_vq). */
#define VIRTIO_NET_QUEUE_SIZE		256
/* Maximum number of RX/TX queue pairs; sizes net_dev.queues[]. */
#define VIRTIO_NET_NUM_QUEUES		8
314f56d42cSAsias He 
32b4fdde6dSAsias He struct net_dev;
33b4fdde6dSAsias He 
34b4fdde6dSAsias He struct net_dev_operations {
35b4fdde6dSAsias He 	int (*rx)(struct iovec *iov, u16 in, struct net_dev *ndev);
36b4fdde6dSAsias He 	int (*tx)(struct iovec *iov, u16 in, struct net_dev *ndev);
37b4fdde6dSAsias He };
38b4fdde6dSAsias He 
39*ad96e867SJean-Philippe Brucker struct net_dev_queue {
40*ad96e867SJean-Philippe Brucker 	int				id;
41*ad96e867SJean-Philippe Brucker 	struct net_dev			*ndev;
42*ad96e867SJean-Philippe Brucker 	struct virt_queue		vq;
43*ad96e867SJean-Philippe Brucker 	pthread_t			thread;
44*ad96e867SJean-Philippe Brucker 	struct mutex			lock;
45*ad96e867SJean-Philippe Brucker 	pthread_cond_t			cond;
46*ad96e867SJean-Philippe Brucker };
47*ad96e867SJean-Philippe Brucker 
488626798bSAsias He struct net_dev {
49d3476f7dSSasha Levin 	struct mutex			mutex;
5002eca50cSAsias He 	struct virtio_device		vdev;
519a6d73f1SSasha Levin 	struct list_head		list;
524f56d42cSAsias He 
53*ad96e867SJean-Philippe Brucker 	struct net_dev_queue		queues[VIRTIO_NET_NUM_QUEUES * 2 + 1];
54c229370aSIngo Molnar 	struct virtio_net_config	config;
55*ad96e867SJean-Philippe Brucker 	u32				features, queue_pairs;
56c4aa7c02SPekka Enberg 
579ed67cdcSSasha Levin 	int				vhost_fd;
584f56d42cSAsias He 	int				tap_fd;
594f56d42cSAsias He 	char				tap_name[IFNAMSIZ];
6059ee54ebSWei Chen 	bool				tap_ufo;
61bb1a32f1SAsias He 
62bb1a32f1SAsias He 	int				mode;
63bb1a32f1SAsias He 
64b5ee1ea7SAsias He 	struct uip_info			info;
65b4fdde6dSAsias He 	struct net_dev_operations	*ops;
669a6d73f1SSasha Levin 	struct kvm			*kvm;
678c0ae74dSSasha Levin 
688c0ae74dSSasha Levin 	struct virtio_net_params	*params;
694f56d42cSAsias He };
704f56d42cSAsias He 
/* List head for net devices (presumably linked through net_dev.list). */
static LIST_HEAD(ndevs);
/* Id handed to compat__remove_message() once a queue gets initialised. */
static int compat_id = -1;

/* Payload capacity of the RX bounce buffer, excluding the virtio-net header. */
#define MAX_PACKET_SIZE 65550
757668c3a6SSasha Levin 
767668c3a6SSasha Levin static bool has_virtio_feature(struct net_dev *ndev, u32 feature)
777668c3a6SSasha Levin {
787668c3a6SSasha Levin 	return ndev->features & (1 << feature);
797668c3a6SSasha Levin }
807668c3a6SSasha Levin 
818ed60bbeSMarc Zyngier static void virtio_net_fix_tx_hdr(struct virtio_net_hdr *hdr, struct net_dev *ndev)
828ed60bbeSMarc Zyngier {
838ed60bbeSMarc Zyngier 	hdr->hdr_len		= virtio_guest_to_host_u16(&ndev->vdev, hdr->hdr_len);
848ed60bbeSMarc Zyngier 	hdr->gso_size		= virtio_guest_to_host_u16(&ndev->vdev, hdr->gso_size);
858ed60bbeSMarc Zyngier 	hdr->csum_start		= virtio_guest_to_host_u16(&ndev->vdev, hdr->csum_start);
868ed60bbeSMarc Zyngier 	hdr->csum_offset	= virtio_guest_to_host_u16(&ndev->vdev, hdr->csum_offset);
878ed60bbeSMarc Zyngier }
888ed60bbeSMarc Zyngier 
893fea89a9SWill Deacon static void virtio_net_fix_rx_hdr(struct virtio_net_hdr *hdr, struct net_dev *ndev)
908ed60bbeSMarc Zyngier {
913fea89a9SWill Deacon 	hdr->hdr_len		= virtio_host_to_guest_u16(&ndev->vdev, hdr->hdr_len);
923fea89a9SWill Deacon 	hdr->gso_size		= virtio_host_to_guest_u16(&ndev->vdev, hdr->gso_size);
933fea89a9SWill Deacon 	hdr->csum_start		= virtio_host_to_guest_u16(&ndev->vdev, hdr->csum_start);
943fea89a9SWill Deacon 	hdr->csum_offset	= virtio_host_to_guest_u16(&ndev->vdev, hdr->csum_offset);
958ed60bbeSMarc Zyngier }
968ed60bbeSMarc Zyngier 
97c4aa7c02SPekka Enberg static void *virtio_net_rx_thread(void *p)
984f56d42cSAsias He {
994f56d42cSAsias He 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
100*ad96e867SJean-Philippe Brucker 	struct net_dev_queue *queue = p;
101*ad96e867SJean-Philippe Brucker 	struct virt_queue *vq = &queue->vq;
102*ad96e867SJean-Philippe Brucker 	struct net_dev *ndev = queue->ndev;
10343835ac9SSasha Levin 	struct kvm *kvm;
1043fdf659dSSasha Levin 	u16 out, in;
1053fdf659dSSasha Levin 	u16 head;
1066d6cc14bSWill Deacon 	int len, copied;
1074f56d42cSAsias He 
108a4d8c55eSSasha Levin 	kvm__set_thread_name("virtio-net-rx");
109a4d8c55eSSasha Levin 
1109a6d73f1SSasha Levin 	kvm = ndev->kvm;
111c4aa7c02SPekka Enberg 	while (1) {
112*ad96e867SJean-Philippe Brucker 		mutex_lock(&queue->lock);
113c4aa7c02SPekka Enberg 		if (!virt_queue__available(vq))
114*ad96e867SJean-Philippe Brucker 			pthread_cond_wait(&queue->cond, &queue->lock.mutex);
115*ad96e867SJean-Philippe Brucker 		mutex_unlock(&queue->lock);
1164f56d42cSAsias He 
1174f56d42cSAsias He 		while (virt_queue__available(vq)) {
1187668c3a6SSasha Levin 			unsigned char buffer[MAX_PACKET_SIZE + sizeof(struct virtio_net_hdr_mrg_rxbuf)];
1197668c3a6SSasha Levin 			struct iovec dummy_iov = {
1207668c3a6SSasha Levin 				.iov_base = buffer,
1217668c3a6SSasha Levin 				.iov_len  = sizeof(buffer),
1227668c3a6SSasha Levin 			};
1237668c3a6SSasha Levin 			struct virtio_net_hdr_mrg_rxbuf *hdr;
1243fea89a9SWill Deacon 			u16 num_buffers;
1257f5ffaf5SAsias He 
1267668c3a6SSasha Levin 			len = ndev->ops->rx(&dummy_iov, 1, ndev);
1276d6cc14bSWill Deacon 			if (len < 0) {
1286d6cc14bSWill Deacon 				pr_warning("%s: rx on vq %u failed (%d), exiting thread\n",
129*ad96e867SJean-Philippe Brucker 						__func__, queue->id, len);
1306d6cc14bSWill Deacon 				goto out_err;
1316d6cc14bSWill Deacon 			}
1326d6cc14bSWill Deacon 
1333fea89a9SWill Deacon 			copied = num_buffers = 0;
1347668c3a6SSasha Levin 			head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1358ed60bbeSMarc Zyngier 			hdr = iov[0].iov_base;
1367668c3a6SSasha Levin 			while (copied < len) {
1376d6cc14bSWill Deacon 				size_t iovsize = min_t(size_t, len - copied, iov_size(iov, in));
1387668c3a6SSasha Levin 
139e2493047SAsias He 				memcpy_toiovec(iov, buffer + copied, iovsize);
1407668c3a6SSasha Levin 				copied += iovsize;
1413fea89a9SWill Deacon 				virt_queue__set_used_elem_no_update(vq, head, iovsize, num_buffers++);
1427668c3a6SSasha Levin 				if (copied == len)
1437668c3a6SSasha Levin 					break;
1447668c3a6SSasha Levin 				while (!virt_queue__available(vq))
1457668c3a6SSasha Levin 					sleep(0);
1467668c3a6SSasha Levin 				head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1477668c3a6SSasha Levin 			}
1483fea89a9SWill Deacon 
1493fea89a9SWill Deacon 			virtio_net_fix_rx_hdr(&hdr->hdr, ndev);
1503fea89a9SWill Deacon 			if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF))
1513fea89a9SWill Deacon 				hdr->num_buffers = virtio_host_to_guest_u16(vq, num_buffers);
1523fea89a9SWill Deacon 
1533fea89a9SWill Deacon 			virt_queue__used_idx_advance(vq, num_buffers);
1543fea89a9SWill Deacon 
155c4aa7c02SPekka Enberg 			/* We should interrupt guest right now, otherwise latency is huge. */
1566585ffb7SSasha Levin 			if (virtio_queue__should_signal(vq))
157*ad96e867SJean-Philippe Brucker 				ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id);
1584f56d42cSAsias He 		}
159c4aa7c02SPekka Enberg 	}
160c4aa7c02SPekka Enberg 
1616d6cc14bSWill Deacon out_err:
162c4aa7c02SPekka Enberg 	pthread_exit(NULL);
163c4aa7c02SPekka Enberg 	return NULL;
164c4aa7c02SPekka Enberg 
165c4aa7c02SPekka Enberg }
166c4aa7c02SPekka Enberg 
167c4aa7c02SPekka Enberg static void *virtio_net_tx_thread(void *p)
1684f56d42cSAsias He {
1694f56d42cSAsias He 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
170*ad96e867SJean-Philippe Brucker 	struct net_dev_queue *queue = p;
171*ad96e867SJean-Philippe Brucker 	struct virt_queue *vq = &queue->vq;
172*ad96e867SJean-Philippe Brucker 	struct net_dev *ndev = queue->ndev;
17343835ac9SSasha Levin 	struct kvm *kvm;
1743fdf659dSSasha Levin 	u16 out, in;
1753fdf659dSSasha Levin 	u16 head;
1764f56d42cSAsias He 	int len;
1774f56d42cSAsias He 
178a4d8c55eSSasha Levin 	kvm__set_thread_name("virtio-net-tx");
179a4d8c55eSSasha Levin 
1809a6d73f1SSasha Levin 	kvm = ndev->kvm;
181c4aa7c02SPekka Enberg 
182c4aa7c02SPekka Enberg 	while (1) {
183*ad96e867SJean-Philippe Brucker 		mutex_lock(&queue->lock);
184c4aa7c02SPekka Enberg 		if (!virt_queue__available(vq))
185*ad96e867SJean-Philippe Brucker 			pthread_cond_wait(&queue->cond, &queue->lock.mutex);
186*ad96e867SJean-Philippe Brucker 		mutex_unlock(&queue->lock);
1874f56d42cSAsias He 
1884f56d42cSAsias He 		while (virt_queue__available(vq)) {
1898ed60bbeSMarc Zyngier 			struct virtio_net_hdr *hdr;
19043835ac9SSasha Levin 			head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1918ed60bbeSMarc Zyngier 			hdr = iov[0].iov_base;
1928ed60bbeSMarc Zyngier 			virtio_net_fix_tx_hdr(hdr, ndev);
1939a6d73f1SSasha Levin 			len = ndev->ops->tx(iov, out, ndev);
1946d6cc14bSWill Deacon 			if (len < 0) {
1956d6cc14bSWill Deacon 				pr_warning("%s: tx on vq %u failed (%d)\n",
196*ad96e867SJean-Philippe Brucker 						__func__, queue->id, errno);
1976d6cc14bSWill Deacon 				goto out_err;
1986d6cc14bSWill Deacon 			}
1996d6cc14bSWill Deacon 
2004f56d42cSAsias He 			virt_queue__set_used_elem(vq, head, len);
2014f56d42cSAsias He 		}
2024f56d42cSAsias He 
2036585ffb7SSasha Levin 		if (virtio_queue__should_signal(vq))
204*ad96e867SJean-Philippe Brucker 			ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id);
2054f56d42cSAsias He 	}
2064f56d42cSAsias He 
2076d6cc14bSWill Deacon out_err:
208c4aa7c02SPekka Enberg 	pthread_exit(NULL);
209c4aa7c02SPekka Enberg 	return NULL;
210c4aa7c02SPekka Enberg }
211407475bfSPekka Enberg 
2126585ffb7SSasha Levin static virtio_net_ctrl_ack virtio_net_handle_mq(struct kvm* kvm, struct net_dev *ndev, struct virtio_net_ctrl_hdr *ctrl)
2136585ffb7SSasha Levin {
2146585ffb7SSasha Levin 	/* Not much to do here */
2156585ffb7SSasha Levin 	return VIRTIO_NET_OK;
2166585ffb7SSasha Levin }
2176585ffb7SSasha Levin 
2186585ffb7SSasha Levin static void *virtio_net_ctrl_thread(void *p)
219abd4a801SSasha Levin {
220abd4a801SSasha Levin 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
221*ad96e867SJean-Philippe Brucker 	struct net_dev_queue *queue = p;
222*ad96e867SJean-Philippe Brucker 	struct virt_queue *vq = &queue->vq;
223*ad96e867SJean-Philippe Brucker 	struct net_dev *ndev = queue->ndev;
224abd4a801SSasha Levin 	u16 out, in, head;
2256585ffb7SSasha Levin 	struct kvm *kvm = ndev->kvm;
226abd4a801SSasha Levin 	struct virtio_net_ctrl_hdr *ctrl;
227abd4a801SSasha Levin 	virtio_net_ctrl_ack *ack;
228abd4a801SSasha Levin 
229edb4a8a0SSuzuki K. Poulose 	kvm__set_thread_name("virtio-net-ctrl");
230edb4a8a0SSuzuki K. Poulose 
2316585ffb7SSasha Levin 	while (1) {
232*ad96e867SJean-Philippe Brucker 		mutex_lock(&queue->lock);
2336585ffb7SSasha Levin 		if (!virt_queue__available(vq))
234*ad96e867SJean-Philippe Brucker 			pthread_cond_wait(&queue->cond, &queue->lock.mutex);
235*ad96e867SJean-Philippe Brucker 		mutex_unlock(&queue->lock);
2366585ffb7SSasha Levin 
2376585ffb7SSasha Levin 		while (virt_queue__available(vq)) {
238*ad96e867SJean-Philippe Brucker 			head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
239abd4a801SSasha Levin 			ctrl = iov[0].iov_base;
240abd4a801SSasha Levin 			ack = iov[out].iov_base;
241abd4a801SSasha Levin 
242abd4a801SSasha Levin 			switch (ctrl->class) {
2436585ffb7SSasha Levin 			case VIRTIO_NET_CTRL_MQ:
2446585ffb7SSasha Levin 				*ack = virtio_net_handle_mq(kvm, ndev, ctrl);
2456585ffb7SSasha Levin 				break;
246abd4a801SSasha Levin 			default:
247abd4a801SSasha Levin 				*ack = VIRTIO_NET_ERR;
248abd4a801SSasha Levin 				break;
249abd4a801SSasha Levin 			}
250*ad96e867SJean-Philippe Brucker 			virt_queue__set_used_elem(vq, head, iov[out].iov_len);
2516585ffb7SSasha Levin 		}
252abd4a801SSasha Levin 
253*ad96e867SJean-Philippe Brucker 		if (virtio_queue__should_signal(vq))
254*ad96e867SJean-Philippe Brucker 			ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id);
2556585ffb7SSasha Levin 	}
256abd4a801SSasha Levin 
2576585ffb7SSasha Levin 	pthread_exit(NULL);
258abd4a801SSasha Levin 
2596585ffb7SSasha Levin 	return NULL;
260abd4a801SSasha Levin }
261abd4a801SSasha Levin 
2629a6d73f1SSasha Levin static void virtio_net_handle_callback(struct kvm *kvm, struct net_dev *ndev, int queue)
2634f56d42cSAsias He {
264*ad96e867SJean-Philippe Brucker 	struct net_dev_queue *net_queue = &ndev->queues[queue];
265*ad96e867SJean-Philippe Brucker 
26679052597SSasha Levin 	if ((u32)queue >= (ndev->queue_pairs * 2 + 1)) {
2679a6d73f1SSasha Levin 		pr_warning("Unknown queue index %u", queue);
2686585ffb7SSasha Levin 		return;
269c4aa7c02SPekka Enberg 	}
2706585ffb7SSasha Levin 
271*ad96e867SJean-Philippe Brucker 	mutex_lock(&net_queue->lock);
272*ad96e867SJean-Philippe Brucker 	pthread_cond_signal(&net_queue->cond);
273*ad96e867SJean-Philippe Brucker 	mutex_unlock(&net_queue->lock);
2744f56d42cSAsias He }
2754f56d42cSAsias He 
276d2a7ddffSMarc Zyngier static int virtio_net_request_tap(struct net_dev *ndev, struct ifreq *ifr,
277d2a7ddffSMarc Zyngier 				  const char *tapname)
278d2a7ddffSMarc Zyngier {
279d2a7ddffSMarc Zyngier 	int ret;
280d2a7ddffSMarc Zyngier 
281d2a7ddffSMarc Zyngier 	memset(ifr, 0, sizeof(*ifr));
282d2a7ddffSMarc Zyngier 	ifr->ifr_flags = IFF_TAP | IFF_NO_PI | IFF_VNET_HDR;
283d2a7ddffSMarc Zyngier 	if (tapname)
284d2a7ddffSMarc Zyngier 		strncpy(ifr->ifr_name, tapname, sizeof(ifr->ifr_name));
285d2a7ddffSMarc Zyngier 
286f83dc816SAndreas Herrmann 	ret = ioctl(ndev->tap_fd, TUNSETIFF, ifr);
287d2a7ddffSMarc Zyngier 
288d2a7ddffSMarc Zyngier 	if (ret >= 0)
289d2a7ddffSMarc Zyngier 		strncpy(ndev->tap_name, ifr->ifr_name, sizeof(ndev->tap_name));
290d2a7ddffSMarc Zyngier 	return ret;
291d2a7ddffSMarc Zyngier }
292d2a7ddffSMarc Zyngier 
/*
 * Run @script with @tap_name as its only argument and wait for it to finish.
 *
 * Returns 0 if the script exited normally with status 0, -1 otherwise. The
 * failure cases are: fork() failed, waiting for the child failed, the script
 * exited with a non-zero status, or the script was terminated abnormally
 * (for example by a signal).
 */
static int virtio_net_exec_script(const char* script, const char *tap_name)
{
	pid_t pid;
	int status;

	pid = fork();
	if (pid < 0) {
		/* Never call waitpid(-1): it would reap an unrelated child. */
		pr_warning("Fail to setup tap by %s", script);
		return -1;
	}

	if (pid == 0) {
		execl(script, script, tap_name, (char *)NULL);
		/* Only reached when the exec itself failed. */
		_exit(1);
	}

	/* Retry when interrupted by a signal so 'status' is always valid below. */
	while (waitpid(pid, &status, 0) < 0) {
		if (errno != EINTR) {
			pr_warning("Fail to setup tap by %s", script);
			return -1;
		}
	}

	if (!WIFEXITED(status) || WEXITSTATUS(status) != 0) {
		pr_warning("Fail to setup tap by %s", script);
		return -1;
	}

	return 0;
}
311eef27ae3SFan Du 
3128c0ae74dSSasha Levin static bool virtio_net__tap_init(struct net_dev *ndev)
3134f56d42cSAsias He {
314cb7202c1SSasha Levin 	int sock = socket(AF_INET, SOCK_STREAM, 0);
31559ee54ebSWei Chen 	int hdr_len;
316cb7202c1SSasha Levin 	struct sockaddr_in sin = {0};
317246c8347SAsias He 	struct ifreq ifr;
3188c0ae74dSSasha Levin 	const struct virtio_net_params *params = ndev->params;
3191dfc7c24SMarc Zyngier 	bool skipconf = !!params->tapif;
3204f56d42cSAsias He 
3217668c3a6SSasha Levin 	hdr_len = has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ?
32248c6b47aSSasha Levin 			sizeof(struct virtio_net_hdr_mrg_rxbuf) :
32348c6b47aSSasha Levin 			sizeof(struct virtio_net_hdr);
3249a6d73f1SSasha Levin 	if (ioctl(ndev->tap_fd, TUNSETVNETHDRSZ, &hdr_len) < 0)
3254542f276SCyrill Gorcunov 		pr_warning("Config tap device TUNSETVNETHDRSZ error");
326246c8347SAsias He 
32773b7d038SAmos Kong 	if (strcmp(params->script, "none")) {
328eef27ae3SFan Du 		if (virtio_net_exec_script(params->script, ndev->tap_name) < 0)
32973b7d038SAmos Kong 			goto fail;
3301dfc7c24SMarc Zyngier 	} else if (!skipconf) {
331cb7202c1SSasha Levin 		memset(&ifr, 0, sizeof(ifr));
3329a6d73f1SSasha Levin 		strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ndev->tap_name));
333bdfcfca6SSasha Levin 		sin.sin_addr.s_addr = inet_addr(params->host_ip);
334cb7202c1SSasha Levin 		memcpy(&(ifr.ifr_addr), &sin, sizeof(ifr.ifr_addr));
335cb7202c1SSasha Levin 		ifr.ifr_addr.sa_family = AF_INET;
3363b02f580SSasha Levin 		if (ioctl(sock, SIOCSIFADDR, &ifr) < 0) {
3374542f276SCyrill Gorcunov 			pr_warning("Could not set ip address on tap device");
3383b02f580SSasha Levin 			goto fail;
3393b02f580SSasha Levin 		}
34073b7d038SAmos Kong 	}
341cb7202c1SSasha Levin 
3421dfc7c24SMarc Zyngier 	if (!skipconf) {
343cb7202c1SSasha Levin 		memset(&ifr, 0, sizeof(ifr));
3449a6d73f1SSasha Levin 		strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ndev->tap_name));
345cb7202c1SSasha Levin 		ioctl(sock, SIOCGIFFLAGS, &ifr);
346cb7202c1SSasha Levin 		ifr.ifr_flags |= IFF_UP | IFF_RUNNING;
347cb7202c1SSasha Levin 		if (ioctl(sock, SIOCSIFFLAGS, &ifr) < 0)
3484542f276SCyrill Gorcunov 			pr_warning("Could not bring tap device up");
3491dfc7c24SMarc Zyngier 	}
350cb7202c1SSasha Levin 
351cb7202c1SSasha Levin 	close(sock);
3523b02f580SSasha Levin 
3533b02f580SSasha Levin 	return 1;
3543b02f580SSasha Levin 
3553b02f580SSasha Levin fail:
3563b02f580SSasha Levin 	if (sock >= 0)
3573b02f580SSasha Levin 		close(sock);
3589a6d73f1SSasha Levin 	if (ndev->tap_fd >= 0)
3599a6d73f1SSasha Levin 		close(ndev->tap_fd);
3603b02f580SSasha Levin 
3613b02f580SSasha Levin 	return 0;
3624f56d42cSAsias He }
3634f56d42cSAsias He 
36459ee54ebSWei Chen static bool virtio_net__tap_create(struct net_dev *ndev)
36559ee54ebSWei Chen {
36659ee54ebSWei Chen 	int offload;
36759ee54ebSWei Chen 	struct ifreq ifr;
36859ee54ebSWei Chen 	const struct virtio_net_params *params = ndev->params;
36959ee54ebSWei Chen 	bool macvtap = (!!params->tapif) && (params->tapif[0] == '/');
37059ee54ebSWei Chen 
37159ee54ebSWei Chen 	/* Did the user already gave us the FD? */
37259ee54ebSWei Chen 	if (params->fd)
37359ee54ebSWei Chen 		ndev->tap_fd = params->fd;
37459ee54ebSWei Chen 	else {
37559ee54ebSWei Chen 		const char *tap_file = "/dev/net/tun";
37659ee54ebSWei Chen 
37759ee54ebSWei Chen 		/* Did the user ask us to use macvtap? */
37859ee54ebSWei Chen 		if (macvtap)
37959ee54ebSWei Chen 			tap_file = params->tapif;
38059ee54ebSWei Chen 
38159ee54ebSWei Chen 		ndev->tap_fd = open(tap_file, O_RDWR);
38259ee54ebSWei Chen 		if (ndev->tap_fd < 0) {
38359ee54ebSWei Chen 			pr_warning("Unable to open %s", tap_file);
38459ee54ebSWei Chen 			return 0;
38559ee54ebSWei Chen 		}
38659ee54ebSWei Chen 	}
38759ee54ebSWei Chen 
38859ee54ebSWei Chen 	if (!macvtap &&
38959ee54ebSWei Chen 	    virtio_net_request_tap(ndev, &ifr, params->tapif) < 0) {
39059ee54ebSWei Chen 		pr_warning("Config tap device error. Are you root?");
39159ee54ebSWei Chen 		goto fail;
39259ee54ebSWei Chen 	}
39359ee54ebSWei Chen 
39459ee54ebSWei Chen 	/*
39559ee54ebSWei Chen 	 * The UFO support had been removed from kernel in commit:
39659ee54ebSWei Chen 	 * ID: fb652fdfe83710da0ca13448a41b7ed027d0a984
39759ee54ebSWei Chen 	 * https://www.spinics.net/lists/netdev/msg443562.html
39859ee54ebSWei Chen 	 * In oder to support the older kernels without this commit,
39959ee54ebSWei Chen 	 * we set the TUN_F_UFO to offload by default to test the status of
40059ee54ebSWei Chen 	 * UFO kernel support.
40159ee54ebSWei Chen 	 */
40259ee54ebSWei Chen 	ndev->tap_ufo = true;
40359ee54ebSWei Chen 	offload = TUN_F_CSUM | TUN_F_TSO4 | TUN_F_TSO6 | TUN_F_UFO;
40459ee54ebSWei Chen 	if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) {
40559ee54ebSWei Chen 		/*
40659ee54ebSWei Chen 		 * Is this failure caused by kernel remove the UFO support?
40759ee54ebSWei Chen 		 * Try TUNSETOFFLOAD without TUN_F_UFO.
40859ee54ebSWei Chen 		 */
40959ee54ebSWei Chen 		offload &= ~TUN_F_UFO;
41059ee54ebSWei Chen 		if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) {
41159ee54ebSWei Chen 			pr_warning("Config tap device TUNSETOFFLOAD error");
41259ee54ebSWei Chen 			goto fail;
41359ee54ebSWei Chen 		}
41459ee54ebSWei Chen 		ndev->tap_ufo = false;
41559ee54ebSWei Chen 	}
41659ee54ebSWei Chen 
41759ee54ebSWei Chen 	return 1;
41859ee54ebSWei Chen 
41959ee54ebSWei Chen fail:
42059ee54ebSWei Chen 	if ((ndev->tap_fd >= 0) || (!params->fd) )
42159ee54ebSWei Chen 		close(ndev->tap_fd);
42259ee54ebSWei Chen 
42359ee54ebSWei Chen 	return 0;
42459ee54ebSWei Chen }
42559ee54ebSWei Chen 
426b4fdde6dSAsias He static inline int tap_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev)
427b4fdde6dSAsias He {
428b4fdde6dSAsias He 	return writev(ndev->tap_fd, iov, out);
429b4fdde6dSAsias He }
430b4fdde6dSAsias He 
431b4fdde6dSAsias He static inline int tap_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev)
432b4fdde6dSAsias He {
433b4fdde6dSAsias He 	return readv(ndev->tap_fd, iov, in);
434b4fdde6dSAsias He }
435b4fdde6dSAsias He 
436b4fdde6dSAsias He static inline int uip_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev)
437b4fdde6dSAsias He {
438b4fdde6dSAsias He 	return uip_tx(iov, out, &ndev->info);
439b4fdde6dSAsias He }
440b4fdde6dSAsias He 
441b4fdde6dSAsias He static inline int uip_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev)
442b4fdde6dSAsias He {
443b4fdde6dSAsias He 	return uip_rx(iov, in, &ndev->info);
444b4fdde6dSAsias He }
445b4fdde6dSAsias He 
446b4fdde6dSAsias He static struct net_dev_operations tap_ops = {
447b4fdde6dSAsias He 	.rx	= tap_ops_rx,
448b4fdde6dSAsias He 	.tx	= tap_ops_tx,
449b4fdde6dSAsias He };
450b4fdde6dSAsias He 
451b4fdde6dSAsias He static struct net_dev_operations uip_ops = {
452b4fdde6dSAsias He 	.rx	= uip_ops_rx,
453b4fdde6dSAsias He 	.tx	= uip_ops_tx,
454b4fdde6dSAsias He };
455b4fdde6dSAsias He 
456c5ae742bSSasha Levin static u8 *get_config(struct kvm *kvm, void *dev)
45778a2a3e2SSasha Levin {
45878a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
45978a2a3e2SSasha Levin 
460c5ae742bSSasha Levin 	return ((u8 *)(&ndev->config));
46178a2a3e2SSasha Levin }
46278a2a3e2SSasha Levin 
46378a2a3e2SSasha Levin static u32 get_host_features(struct kvm *kvm, void *dev)
46478a2a3e2SSasha Levin {
46559ee54ebSWei Chen 	u32 features;
46679052597SSasha Levin 	struct net_dev *ndev = dev;
46779052597SSasha Levin 
46859ee54ebSWei Chen 	features = 1UL << VIRTIO_NET_F_MAC
46978a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_CSUM
47078a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_HOST_TSO4
47178a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_HOST_TSO6
47278a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_GUEST_TSO4
47392c1f37bSSasha Levin 		| 1UL << VIRTIO_NET_F_GUEST_TSO6
474754c8ce3SSasha Levin 		| 1UL << VIRTIO_RING_F_EVENT_IDX
475abd4a801SSasha Levin 		| 1UL << VIRTIO_RING_F_INDIRECT_DESC
4766585ffb7SSasha Levin 		| 1UL << VIRTIO_NET_F_CTRL_VQ
4777668c3a6SSasha Levin 		| 1UL << VIRTIO_NET_F_MRG_RXBUF
47879052597SSasha Levin 		| 1UL << (ndev->queue_pairs > 1 ? VIRTIO_NET_F_MQ : 0);
47959ee54ebSWei Chen 
48059ee54ebSWei Chen 	/*
48159ee54ebSWei Chen 	 * The UFO feature for host and guest only can be enabled when the
48259ee54ebSWei Chen 	 * kernel has TAP UFO support.
48359ee54ebSWei Chen 	 */
48459ee54ebSWei Chen 	if (ndev->tap_ufo)
48559ee54ebSWei Chen 		features |= (1UL << VIRTIO_NET_F_HOST_UFO
48659ee54ebSWei Chen 				| 1UL << VIRTIO_NET_F_GUEST_UFO);
48759ee54ebSWei Chen 
48859ee54ebSWei Chen 	return features;
48978a2a3e2SSasha Levin }
49078a2a3e2SSasha Levin 
49115636d5eSYing-Shiuan Pan static int virtio_net__vhost_set_features(struct net_dev *ndev)
49215636d5eSYing-Shiuan Pan {
49315636d5eSYing-Shiuan Pan 	u64 features = 1UL << VIRTIO_RING_F_EVENT_IDX;
49415636d5eSYing-Shiuan Pan 	u64 vhost_features;
49515636d5eSYing-Shiuan Pan 
49615636d5eSYing-Shiuan Pan 	if (ioctl(ndev->vhost_fd, VHOST_GET_FEATURES, &vhost_features) != 0)
49715636d5eSYing-Shiuan Pan 		die_perror("VHOST_GET_FEATURES failed");
49815636d5eSYing-Shiuan Pan 
49915636d5eSYing-Shiuan Pan 	/* make sure both side support mergable rx buffers */
50015636d5eSYing-Shiuan Pan 	if (vhost_features & 1UL << VIRTIO_NET_F_MRG_RXBUF &&
50115636d5eSYing-Shiuan Pan 			has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF))
50215636d5eSYing-Shiuan Pan 		features |= 1UL << VIRTIO_NET_F_MRG_RXBUF;
50315636d5eSYing-Shiuan Pan 
50415636d5eSYing-Shiuan Pan 	return ioctl(ndev->vhost_fd, VHOST_SET_FEATURES, &features);
50515636d5eSYing-Shiuan Pan }
50615636d5eSYing-Shiuan Pan 
50778a2a3e2SSasha Levin static void set_guest_features(struct kvm *kvm, void *dev, u32 features)
50878a2a3e2SSasha Levin {
50978a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
5108ed60bbeSMarc Zyngier 	struct virtio_net_config *conf = &ndev->config;
51178a2a3e2SSasha Levin 
51278a2a3e2SSasha Levin 	ndev->features = features;
5138aa155c4SYing-Shiuan Pan 
5148ed60bbeSMarc Zyngier 	conf->status = virtio_host_to_guest_u16(&ndev->vdev, conf->status);
5158ed60bbeSMarc Zyngier 	conf->max_virtqueue_pairs = virtio_host_to_guest_u16(&ndev->vdev,
5168ed60bbeSMarc Zyngier 							     conf->max_virtqueue_pairs);
51795242e44SJean-Philippe Brucker }
5188ed60bbeSMarc Zyngier 
51995242e44SJean-Philippe Brucker static void virtio_net_start(struct net_dev *ndev)
52095242e44SJean-Philippe Brucker {
5218aa155c4SYing-Shiuan Pan 	if (ndev->mode == NET_MODE_TAP) {
5228aa155c4SYing-Shiuan Pan 		if (!virtio_net__tap_init(ndev))
52359ee54ebSWei Chen 			die_perror("TAP device initialized failed because");
52459ee54ebSWei Chen 
52515636d5eSYing-Shiuan Pan 		if (ndev->vhost_fd &&
52615636d5eSYing-Shiuan Pan 				virtio_net__vhost_set_features(ndev) != 0)
52715636d5eSYing-Shiuan Pan 			die_perror("VHOST_SET_FEATURES failed");
5288aa155c4SYing-Shiuan Pan 	} else {
5298aa155c4SYing-Shiuan Pan 		ndev->info.vnet_hdr_len = has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ?
5308aa155c4SYing-Shiuan Pan 						sizeof(struct virtio_net_hdr_mrg_rxbuf) :
5318aa155c4SYing-Shiuan Pan 						sizeof(struct virtio_net_hdr);
5328aa155c4SYing-Shiuan Pan 		uip_init(&ndev->info);
5338aa155c4SYing-Shiuan Pan 	}
53478a2a3e2SSasha Levin }
53578a2a3e2SSasha Levin 
53695242e44SJean-Philippe Brucker static void notify_status(struct kvm *kvm, void *dev, u32 status)
53795242e44SJean-Philippe Brucker {
53895242e44SJean-Philippe Brucker 	if (status & VIRTIO__STATUS_START)
53995242e44SJean-Philippe Brucker 		virtio_net_start(dev);
54095242e44SJean-Philippe Brucker }
54195242e44SJean-Philippe Brucker 
5429e56ec14SSasha Levin static bool is_ctrl_vq(struct net_dev *ndev, u32 vq)
5439e56ec14SSasha Levin {
5449e56ec14SSasha Levin 	return vq == (u32)(ndev->queue_pairs * 2);
5459e56ec14SSasha Levin }
5469e56ec14SSasha Levin 
547c59ba304SWill Deacon static int init_vq(struct kvm *kvm, void *dev, u32 vq, u32 page_size, u32 align,
548c59ba304SWill Deacon 		   u32 pfn)
54978a2a3e2SSasha Levin {
5509ed67cdcSSasha Levin 	struct vhost_vring_state state = { .index = vq };
551*ad96e867SJean-Philippe Brucker 	struct net_dev_queue *net_queue;
5529ed67cdcSSasha Levin 	struct vhost_vring_addr addr;
55378a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
55478a2a3e2SSasha Levin 	struct virt_queue *queue;
55578a2a3e2SSasha Levin 	void *p;
5569ed67cdcSSasha Levin 	int r;
55778a2a3e2SSasha Levin 
558312c62d1SSasha Levin 	compat__remove_message(compat_id);
55978a2a3e2SSasha Levin 
560*ad96e867SJean-Philippe Brucker 	net_queue	= &ndev->queues[vq];
561*ad96e867SJean-Philippe Brucker 	net_queue->id	= vq;
562*ad96e867SJean-Philippe Brucker 	net_queue->ndev	= ndev;
563*ad96e867SJean-Philippe Brucker 	queue		= &net_queue->vq;
56478a2a3e2SSasha Levin 	queue->pfn	= pfn;
565e7e2950aSSasha Levin 	p		= virtio_get_vq(kvm, queue->pfn, page_size);
56678a2a3e2SSasha Levin 
567c59ba304SWill Deacon 	vring_init(&queue->vring, VIRTIO_NET_QUEUE_SIZE, p, align);
5688ed60bbeSMarc Zyngier 	virtio_init_device_vq(&ndev->vdev, queue);
56978a2a3e2SSasha Levin 
570*ad96e867SJean-Philippe Brucker 	mutex_init(&net_queue->lock);
571*ad96e867SJean-Philippe Brucker 	pthread_cond_init(&net_queue->cond, NULL);
5729e56ec14SSasha Levin 	if (is_ctrl_vq(ndev, vq)) {
573*ad96e867SJean-Philippe Brucker 		pthread_create(&net_queue->thread, NULL, virtio_net_ctrl_thread,
574*ad96e867SJean-Philippe Brucker 			       net_queue);
5759e56ec14SSasha Levin 
5769e56ec14SSasha Levin 		return 0;
5779e56ec14SSasha Levin 	} else if (ndev->vhost_fd == 0 ) {
5789e56ec14SSasha Levin 		if (vq & 1)
579*ad96e867SJean-Philippe Brucker 			pthread_create(&net_queue->thread, NULL,
580*ad96e867SJean-Philippe Brucker 				       virtio_net_tx_thread, net_queue);
5816585ffb7SSasha Levin 		else
582*ad96e867SJean-Philippe Brucker 			pthread_create(&net_queue->thread, NULL,
583*ad96e867SJean-Philippe Brucker 				       virtio_net_rx_thread, net_queue);
5846585ffb7SSasha Levin 
58578a2a3e2SSasha Levin 		return 0;
5866585ffb7SSasha Levin 	}
5879ed67cdcSSasha Levin 
5888ed60bbeSMarc Zyngier 	if (queue->endian != VIRTIO_ENDIAN_HOST)
589b960f243SAndre Przywara 		die_perror("VHOST requires the same endianness in guest and host");
5908ed60bbeSMarc Zyngier 
5919ed67cdcSSasha Levin 	state.num = queue->vring.num;
5929ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_NUM, &state);
5939ed67cdcSSasha Levin 	if (r < 0)
5949ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_NUM failed");
5959ed67cdcSSasha Levin 	state.num = 0;
5969ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_BASE, &state);
5979ed67cdcSSasha Levin 	if (r < 0)
5989ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_BASE failed");
5999ed67cdcSSasha Levin 
6009ed67cdcSSasha Levin 	addr = (struct vhost_vring_addr) {
6019ed67cdcSSasha Levin 		.index = vq,
6029ed67cdcSSasha Levin 		.desc_user_addr = (u64)(unsigned long)queue->vring.desc,
6039ed67cdcSSasha Levin 		.avail_user_addr = (u64)(unsigned long)queue->vring.avail,
6049ed67cdcSSasha Levin 		.used_user_addr = (u64)(unsigned long)queue->vring.used,
6059ed67cdcSSasha Levin 	};
6069ed67cdcSSasha Levin 
6079ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_ADDR, &addr);
6089ed67cdcSSasha Levin 	if (r < 0)
6099ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_ADDR failed");
6109ed67cdcSSasha Levin 
6119ed67cdcSSasha Levin 	return 0;
6129ed67cdcSSasha Levin }
6139ed67cdcSSasha Levin 
6149ed67cdcSSasha Levin static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi)
6159ed67cdcSSasha Levin {
6169ed67cdcSSasha Levin 	struct net_dev *ndev = dev;
617*ad96e867SJean-Philippe Brucker 	struct net_dev_queue *queue = &ndev->queues[vq];
6189ed67cdcSSasha Levin 	struct vhost_vring_file file;
6199ed67cdcSSasha Levin 	int r;
6209ed67cdcSSasha Levin 
6219ed67cdcSSasha Levin 	if (ndev->vhost_fd == 0)
6229ed67cdcSSasha Levin 		return;
6239ed67cdcSSasha Levin 
6249ed67cdcSSasha Levin 	file = (struct vhost_vring_file) {
6259ed67cdcSSasha Levin 		.index	= vq,
626e59679d2SJean-Philippe Brucker 		.fd	= eventfd(0, 0),
6279ed67cdcSSasha Levin 	};
6289ed67cdcSSasha Levin 
629e59679d2SJean-Philippe Brucker 	r = irq__add_irqfd(kvm, gsi, file.fd, -1);
6309ed67cdcSSasha Levin 	if (r < 0)
6319ed67cdcSSasha Levin 		die_perror("KVM_IRQFD failed");
6329ed67cdcSSasha Levin 
6339ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_CALL, &file);
6349ed67cdcSSasha Levin 	if (r < 0)
6359ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_CALL failed");
6369ed67cdcSSasha Levin 	file.fd = ndev->tap_fd;
6379ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_NET_SET_BACKEND, &file);
6389ed67cdcSSasha Levin 	if (r != 0)
6399ed67cdcSSasha Levin 		die("VHOST_NET_SET_BACKEND failed %d", errno);
6409ed67cdcSSasha Levin 
6419ed67cdcSSasha Levin }
6429ed67cdcSSasha Levin 
6439ed67cdcSSasha Levin static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd)
6449ed67cdcSSasha Levin {
6459ed67cdcSSasha Levin 	struct net_dev *ndev = dev;
6469ed67cdcSSasha Levin 	struct vhost_vring_file file = {
6479ed67cdcSSasha Levin 		.index	= vq,
6489ed67cdcSSasha Levin 		.fd	= efd,
6499ed67cdcSSasha Levin 	};
6509ed67cdcSSasha Levin 	int r;
6519ed67cdcSSasha Levin 
6529e56ec14SSasha Levin 	if (ndev->vhost_fd == 0 || is_ctrl_vq(ndev, vq))
6539ed67cdcSSasha Levin 		return;
6549ed67cdcSSasha Levin 
6559ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_VRING_KICK, &file);
6569ed67cdcSSasha Levin 	if (r < 0)
6579ed67cdcSSasha Levin 		die_perror("VHOST_SET_VRING_KICK failed");
65878a2a3e2SSasha Levin }
65978a2a3e2SSasha Levin 
66078a2a3e2SSasha Levin static int notify_vq(struct kvm *kvm, void *dev, u32 vq)
66178a2a3e2SSasha Levin {
6629a6d73f1SSasha Levin 	struct net_dev *ndev = dev;
6639a6d73f1SSasha Levin 
6649a6d73f1SSasha Levin 	virtio_net_handle_callback(kvm, ndev, vq);
66578a2a3e2SSasha Levin 
66678a2a3e2SSasha Levin 	return 0;
66778a2a3e2SSasha Levin }
66878a2a3e2SSasha Levin 
66953fbb17bSJean-Philippe Brucker static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq)
67078a2a3e2SSasha Levin {
67178a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
67278a2a3e2SSasha Levin 
673*ad96e867SJean-Philippe Brucker 	return &ndev->queues[vq].vq;
67478a2a3e2SSasha Levin }
67578a2a3e2SSasha Levin 
67678a2a3e2SSasha Levin static int get_size_vq(struct kvm *kvm, void *dev, u32 vq)
67778a2a3e2SSasha Levin {
6780f4f51a8SAsias He 	/* FIXME: dynamic */
67978a2a3e2SSasha Levin 	return VIRTIO_NET_QUEUE_SIZE;
68078a2a3e2SSasha Levin }
68178a2a3e2SSasha Levin 
6820f4f51a8SAsias He static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size)
6830f4f51a8SAsias He {
6840f4f51a8SAsias He 	/* FIXME: dynamic */
6850f4f51a8SAsias He 	return size;
6860f4f51a8SAsias He }
6870f4f51a8SAsias He 
688b98ac591SJean-Philippe Brucker static int get_vq_count(struct kvm *kvm, void *dev)
689b98ac591SJean-Philippe Brucker {
690b98ac591SJean-Philippe Brucker 	struct net_dev *ndev = dev;
691b98ac591SJean-Philippe Brucker 
692b98ac591SJean-Philippe Brucker 	return ndev->queue_pairs * 2 + 1;
693b98ac591SJean-Philippe Brucker }
694b98ac591SJean-Philippe Brucker 
69515542babSAndre Przywara static struct virtio_ops net_dev_virtio_ops = {
6961c47ce69SSasha Levin 	.get_config		= get_config,
6971c47ce69SSasha Levin 	.get_host_features	= get_host_features,
6981c47ce69SSasha Levin 	.set_guest_features	= set_guest_features,
699b98ac591SJean-Philippe Brucker 	.get_vq_count		= get_vq_count,
7001c47ce69SSasha Levin 	.init_vq		= init_vq,
70153fbb17bSJean-Philippe Brucker 	.get_vq			= get_vq,
7021c47ce69SSasha Levin 	.get_size_vq		= get_size_vq,
7030f4f51a8SAsias He 	.set_size_vq		= set_size_vq,
7040f4f51a8SAsias He 	.notify_vq		= notify_vq,
7059ed67cdcSSasha Levin 	.notify_vq_gsi		= notify_vq_gsi,
7069ed67cdcSSasha Levin 	.notify_vq_eventfd	= notify_vq_eventfd,
70795242e44SJean-Philippe Brucker 	.notify_status		= notify_status,
7081c47ce69SSasha Levin };
7091c47ce69SSasha Levin 
7109ed67cdcSSasha Levin static void virtio_net__vhost_init(struct kvm *kvm, struct net_dev *ndev)
7119ed67cdcSSasha Levin {
7127f9733c2SAndreas Herrmann 	struct kvm_mem_bank *bank;
7139ed67cdcSSasha Levin 	struct vhost_memory *mem;
7147f9733c2SAndreas Herrmann 	int r, i;
7159ed67cdcSSasha Levin 
7169ed67cdcSSasha Levin 	ndev->vhost_fd = open("/dev/vhost-net", O_RDWR);
7179ed67cdcSSasha Levin 	if (ndev->vhost_fd < 0)
7189ed67cdcSSasha Levin 		die_perror("Failed openning vhost-net device");
7199ed67cdcSSasha Levin 
7207f9733c2SAndreas Herrmann 	mem = calloc(1, sizeof(*mem) + kvm->mem_slots * sizeof(struct vhost_memory_region));
7219ed67cdcSSasha Levin 	if (mem == NULL)
7229ed67cdcSSasha Levin 		die("Failed allocating memory for vhost memory map");
7239ed67cdcSSasha Levin 
7247f9733c2SAndreas Herrmann 	i = 0;
7257f9733c2SAndreas Herrmann 	list_for_each_entry(bank, &kvm->mem_banks, list) {
7267f9733c2SAndreas Herrmann 		mem->regions[i] = (struct vhost_memory_region) {
7277f9733c2SAndreas Herrmann 			.guest_phys_addr = bank->guest_phys_addr,
7287f9733c2SAndreas Herrmann 			.memory_size	 = bank->size,
7297f9733c2SAndreas Herrmann 			.userspace_addr	 = (unsigned long)bank->host_addr,
7309ed67cdcSSasha Levin 		};
7317f9733c2SAndreas Herrmann 		i++;
7327f9733c2SAndreas Herrmann 	}
7337f9733c2SAndreas Herrmann 	mem->nregions = i;
7349ed67cdcSSasha Levin 
7359ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_OWNER);
7369ed67cdcSSasha Levin 	if (r != 0)
7379ed67cdcSSasha Levin 		die_perror("VHOST_SET_OWNER failed");
7389ed67cdcSSasha Levin 
7399ed67cdcSSasha Levin 	r = ioctl(ndev->vhost_fd, VHOST_SET_MEM_TABLE, mem);
7409ed67cdcSSasha Levin 	if (r != 0)
7419ed67cdcSSasha Levin 		die_perror("VHOST_SET_MEM_TABLE failed");
742627d6874SAsias He 
743627d6874SAsias He 	ndev->vdev.use_vhost = true;
744627d6874SAsias He 
7459ed67cdcSSasha Levin 	free(mem);
7469ed67cdcSSasha Levin }
7479ed67cdcSSasha Levin 
/*
 * Parse a MAC address written as six colon-separated hex bytes
 * ("aa:bb:cc:dd:ee:ff") from @str into the 6-byte buffer @mac.
 *
 * @mac is only written when all six bytes were parsed; on malformed input
 * it is left untouched, so a caller-provided default stays intact instead
 * of being partially overwritten.
 */
static inline void str_to_mac(const char *str, char *mac)
{
	unsigned char bytes[6];
	int i;

	if (sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
		   &bytes[0], &bytes[1], &bytes[2],
		   &bytes[3], &bytes[4], &bytes[5]) != 6)
		return;

	for (i = 0; i < 6; i++)
		mac[i] = bytes[i];
}
7534346fd8fSSasha Levin static int set_net_param(struct kvm *kvm, struct virtio_net_params *p,
7544346fd8fSSasha Levin 			const char *param, const char *val)
7555f225124SSasha Levin {
7565f225124SSasha Levin 	if (strcmp(param, "guest_mac") == 0) {
7575f225124SSasha Levin 		str_to_mac(val, p->guest_mac);
7585f225124SSasha Levin 	} else if (strcmp(param, "mode") == 0) {
7595f225124SSasha Levin 		if (!strncmp(val, "user", 4)) {
7605f225124SSasha Levin 			int i;
7615f225124SSasha Levin 
7625f225124SSasha Levin 			for (i = 0; i < kvm->cfg.num_net_devices; i++)
7635f225124SSasha Levin 				if (kvm->cfg.net_params[i].mode == NET_MODE_USER)
7645f225124SSasha Levin 					die("Only one usermode network device allowed at a time");
7655f225124SSasha Levin 			p->mode = NET_MODE_USER;
7665f225124SSasha Levin 		} else if (!strncmp(val, "tap", 3)) {
7675f225124SSasha Levin 			p->mode = NET_MODE_TAP;
7685f225124SSasha Levin 		} else if (!strncmp(val, "none", 4)) {
7695f225124SSasha Levin 			kvm->cfg.no_net = 1;
7705f225124SSasha Levin 			return -1;
7715f225124SSasha Levin 		} else
7725f225124SSasha Levin 			die("Unknown network mode %s, please use user, tap or none", kvm->cfg.network);
7735f225124SSasha Levin 	} else if (strcmp(param, "script") == 0) {
7745f225124SSasha Levin 		p->script = strdup(val);
775eef27ae3SFan Du 	} else if (strcmp(param, "downscript") == 0) {
776eef27ae3SFan Du 		p->downscript = strdup(val);
7775f225124SSasha Levin 	} else if (strcmp(param, "guest_ip") == 0) {
7785f225124SSasha Levin 		p->guest_ip = strdup(val);
7795f225124SSasha Levin 	} else if (strcmp(param, "host_ip") == 0) {
7805f225124SSasha Levin 		p->host_ip = strdup(val);
7815f225124SSasha Levin 	} else if (strcmp(param, "trans") == 0) {
7825f225124SSasha Levin 		p->trans = strdup(val);
7831dfc7c24SMarc Zyngier 	} else if (strcmp(param, "tapif") == 0) {
7841dfc7c24SMarc Zyngier 		p->tapif = strdup(val);
7855f225124SSasha Levin 	} else if (strcmp(param, "vhost") == 0) {
7865f225124SSasha Levin 		p->vhost = atoi(val);
7875f225124SSasha Levin 	} else if (strcmp(param, "fd") == 0) {
7885f225124SSasha Levin 		p->fd = atoi(val);
78979052597SSasha Levin 	} else if (strcmp(param, "mq") == 0) {
79079052597SSasha Levin 		p->mq = atoi(val);
7915f225124SSasha Levin 	} else
7925f225124SSasha Levin 		die("Unknown network parameter %s", param);
7935f225124SSasha Levin 
7945f225124SSasha Levin 	return 0;
7955f225124SSasha Levin }
7965f225124SSasha Levin 
7975f225124SSasha Levin int netdev_parser(const struct option *opt, const char *arg, int unset)
7985f225124SSasha Levin {
7995f225124SSasha Levin 	struct virtio_net_params p;
8005f225124SSasha Levin 	char *buf = NULL, *cmd = NULL, *cur = NULL;
8015f225124SSasha Levin 	bool on_cmd = true;
8025f225124SSasha Levin 	struct kvm *kvm = opt->ptr;
8035f225124SSasha Levin 
8045f225124SSasha Levin 	if (arg) {
8055f225124SSasha Levin 		buf = strdup(arg);
8065f225124SSasha Levin 		if (buf == NULL)
8075f225124SSasha Levin 			die("Failed allocating new net buffer");
8085f225124SSasha Levin 		cur = strtok(buf, ",=");
8095f225124SSasha Levin 	}
8105f225124SSasha Levin 
8115f225124SSasha Levin 	p = (struct virtio_net_params) {
8125f225124SSasha Levin 		.guest_ip	= DEFAULT_GUEST_ADDR,
8135f225124SSasha Levin 		.host_ip	= DEFAULT_HOST_ADDR,
8145f225124SSasha Levin 		.script		= DEFAULT_SCRIPT,
815eef27ae3SFan Du 		.downscript	= DEFAULT_SCRIPT,
8165f225124SSasha Levin 		.mode		= NET_MODE_TAP,
8175f225124SSasha Levin 	};
8185f225124SSasha Levin 
8195f225124SSasha Levin 	str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac);
8205f225124SSasha Levin 	p.guest_mac[5] += kvm->cfg.num_net_devices;
8215f225124SSasha Levin 
8225f225124SSasha Levin 	while (cur) {
8235f225124SSasha Levin 		if (on_cmd) {
8245f225124SSasha Levin 			cmd = cur;
8255f225124SSasha Levin 		} else {
8264346fd8fSSasha Levin 			if (set_net_param(kvm, &p, cmd, cur) < 0)
8275f225124SSasha Levin 				goto done;
8285f225124SSasha Levin 		}
8295f225124SSasha Levin 		on_cmd = !on_cmd;
8305f225124SSasha Levin 
8315f225124SSasha Levin 		cur = strtok(NULL, ",=");
8325f225124SSasha Levin 	};
8335f225124SSasha Levin 
8345f225124SSasha Levin 	kvm->cfg.num_net_devices++;
8355f225124SSasha Levin 
8365f225124SSasha Levin 	kvm->cfg.net_params = realloc(kvm->cfg.net_params, kvm->cfg.num_net_devices * sizeof(*kvm->cfg.net_params));
8375f225124SSasha Levin 	if (kvm->cfg.net_params == NULL)
8385f225124SSasha Levin 		die("Failed adding new network device");
8395f225124SSasha Levin 
8405f225124SSasha Levin 	kvm->cfg.net_params[kvm->cfg.num_net_devices - 1] = p;
8415f225124SSasha Levin 
8425f225124SSasha Levin done:
8435f225124SSasha Levin 	free(buf);
8445f225124SSasha Levin 	return 0;
8455f225124SSasha Levin }
8465f225124SSasha Levin 
8475f225124SSasha Levin static int virtio_net__init_one(struct virtio_net_params *params)
8484f56d42cSAsias He {
84976a4aac6SWill Deacon 	int i, err;
8509a6d73f1SSasha Levin 	struct net_dev *ndev;
85176a4aac6SWill Deacon 	struct virtio_ops *ops;
852dc7a55d6SSuzuki K. Poulose 	enum virtio_trans trans = VIRTIO_DEFAULT_TRANS(params->kvm);
8539a6d73f1SSasha Levin 
8549a6d73f1SSasha Levin 	ndev = calloc(1, sizeof(struct net_dev));
8559a6d73f1SSasha Levin 	if (ndev == NULL)
8565f225124SSasha Levin 		return -ENOMEM;
8579a6d73f1SSasha Levin 
85876a4aac6SWill Deacon 	ops = malloc(sizeof(*ops));
85976a4aac6SWill Deacon 	if (ops == NULL) {
86076a4aac6SWill Deacon 		err = -ENOMEM;
86176a4aac6SWill Deacon 		goto err_free_ndev;
86276a4aac6SWill Deacon 	}
86376a4aac6SWill Deacon 
8649a6d73f1SSasha Levin 	list_add_tail(&ndev->list, &ndevs);
8659a6d73f1SSasha Levin 
8669a6d73f1SSasha Levin 	ndev->kvm = params->kvm;
8678c0ae74dSSasha Levin 	ndev->params = params;
8689a6d73f1SSasha Levin 
8699a6d73f1SSasha Levin 	mutex_init(&ndev->mutex);
87079052597SSasha Levin 	ndev->queue_pairs = max(1, min(VIRTIO_NET_NUM_QUEUES, params->mq));
8719a6d73f1SSasha Levin 	ndev->config.status = VIRTIO_NET_S_LINK_UP;
87279052597SSasha Levin 	if (ndev->queue_pairs > 1)
87379052597SSasha Levin 		ndev->config.max_virtqueue_pairs = ndev->queue_pairs;
87479052597SSasha Levin 
8750c54698eSAsias He 	for (i = 0 ; i < 6 ; i++) {
8769a6d73f1SSasha Levin 		ndev->config.mac[i]		= params->guest_mac[i];
8779a6d73f1SSasha Levin 		ndev->info.guest_mac.addr[i]	= params->guest_mac[i];
8789a6d73f1SSasha Levin 		ndev->info.host_mac.addr[i]	= params->host_mac[i];
8790c54698eSAsias He 	}
880f715177dSAsias He 
8819a6d73f1SSasha Levin 	ndev->mode = params->mode;
8829a6d73f1SSasha Levin 	if (ndev->mode == NET_MODE_TAP) {
8839a6d73f1SSasha Levin 		ndev->ops = &tap_ops;
88459ee54ebSWei Chen 		if (!virtio_net__tap_create(ndev))
88559ee54ebSWei Chen 			die_perror("You have requested a TAP device, but creation of one has failed because");
886b4fdde6dSAsias He 	} else {
8879a6d73f1SSasha Levin 		ndev->info.host_ip		= ntohl(inet_addr(params->host_ip));
8889a6d73f1SSasha Levin 		ndev->info.guest_ip		= ntohl(inet_addr(params->guest_ip));
8899a6d73f1SSasha Levin 		ndev->info.guest_netmask	= ntohl(inet_addr("255.255.255.0"));
8909a6d73f1SSasha Levin 		ndev->info.buf_nr		= 20,
8919a6d73f1SSasha Levin 		ndev->ops = &uip_ops;
8925f3aaf22SMarc Zyngier 		uip_static_init(&ndev->info);
893b4fdde6dSAsias He 	}
894b5ee1ea7SAsias He 
89576a4aac6SWill Deacon 	*ops = net_dev_virtio_ops;
896dc7a55d6SSuzuki K. Poulose 
897dc7a55d6SSuzuki K. Poulose 	if (params->trans) {
898dc7a55d6SSuzuki K. Poulose 		if (strcmp(params->trans, "mmio") == 0)
899dc7a55d6SSuzuki K. Poulose 			trans = VIRTIO_MMIO;
900dc7a55d6SSuzuki K. Poulose 		else if (strcmp(params->trans, "pci") == 0)
901dc7a55d6SSuzuki K. Poulose 			trans = VIRTIO_PCI;
90269205aa1SAsias He 		else
903dc7a55d6SSuzuki K. Poulose 			pr_warning("virtio-net: Unknown transport method : %s, "
904dc7a55d6SSuzuki K. Poulose 				   "falling back to %s.", params->trans,
905dc7a55d6SSuzuki K. Poulose 				   virtio_trans_name(trans));
906dc7a55d6SSuzuki K. Poulose 	}
907dc7a55d6SSuzuki K. Poulose 
908dc7a55d6SSuzuki K. Poulose 	virtio_init(params->kvm, ndev, &ndev->vdev, ops, trans,
90976a4aac6SWill Deacon 		    PCI_DEVICE_ID_VIRTIO_NET, VIRTIO_ID_NET, PCI_CLASS_NET);
91027ab67f5SSasha Levin 
9119ed67cdcSSasha Levin 	if (params->vhost)
9129ed67cdcSSasha Levin 		virtio_net__vhost_init(params->kvm, ndev);
913cb83de6fSSasha Levin 
914d278197dSAsias He 	if (compat_id == -1)
91552f34d2cSAsias He 		compat_id = virtio_compat_add_message("virtio-net", "CONFIG_VIRTIO_NET");
9165f225124SSasha Levin 
9175f225124SSasha Levin 	return 0;
91876a4aac6SWill Deacon 
91976a4aac6SWill Deacon err_free_ndev:
92076a4aac6SWill Deacon 	free(ndev);
92176a4aac6SWill Deacon 	return err;
9225f225124SSasha Levin }
9235f225124SSasha Levin 
9245f225124SSasha Levin int virtio_net__init(struct kvm *kvm)
9255f225124SSasha Levin {
9265f225124SSasha Levin 	int i;
9275f225124SSasha Levin 
9285f225124SSasha Levin 	for (i = 0; i < kvm->cfg.num_net_devices; i++) {
9295f225124SSasha Levin 		kvm->cfg.net_params[i].kvm = kvm;
9305f225124SSasha Levin 		virtio_net__init_one(&kvm->cfg.net_params[i]);
9315f225124SSasha Levin 	}
9325f225124SSasha Levin 
9335f225124SSasha Levin 	if (kvm->cfg.num_net_devices == 0 && kvm->cfg.no_net == 0) {
9348c0ae74dSSasha Levin 		static struct virtio_net_params net_params;
9355f225124SSasha Levin 
9365f225124SSasha Levin 		net_params = (struct virtio_net_params) {
9375f225124SSasha Levin 			.guest_ip	= kvm->cfg.guest_ip,
9385f225124SSasha Levin 			.host_ip	= kvm->cfg.host_ip,
9395f225124SSasha Levin 			.kvm		= kvm,
9405f225124SSasha Levin 			.script		= kvm->cfg.script,
9415f225124SSasha Levin 			.mode		= NET_MODE_USER,
9425f225124SSasha Levin 		};
9435f225124SSasha Levin 		str_to_mac(kvm->cfg.guest_mac, net_params.guest_mac);
9445f225124SSasha Levin 		str_to_mac(kvm->cfg.host_mac, net_params.host_mac);
9455f225124SSasha Levin 
9465f225124SSasha Levin 		virtio_net__init_one(&net_params);
9475f225124SSasha Levin 	}
9485f225124SSasha Levin 
9495f225124SSasha Levin 	return 0;
9505f225124SSasha Levin }
95149a8afd1SSasha Levin virtio_dev_init(virtio_net__init);
9525f225124SSasha Levin 
9535f225124SSasha Levin int virtio_net__exit(struct kvm *kvm)
9545f225124SSasha Levin {
955eef27ae3SFan Du 	struct virtio_net_params *params;
956eef27ae3SFan Du 	struct net_dev *ndev;
957eef27ae3SFan Du 	struct list_head *ptr;
958eef27ae3SFan Du 
959eef27ae3SFan Du 	list_for_each(ptr, &ndevs) {
960eef27ae3SFan Du 		ndev = list_entry(ptr, struct net_dev, list);
961eef27ae3SFan Du 		params = ndev->params;
962eef27ae3SFan Du 		/* Cleanup any tap device which attached to bridge */
963eef27ae3SFan Du 		if (ndev->mode == NET_MODE_TAP &&
964eef27ae3SFan Du 		    strcmp(params->downscript, "none"))
965eef27ae3SFan Du 			virtio_net_exec_script(params->downscript, ndev->tap_name);
966eef27ae3SFan Du 	}
9675f225124SSasha Levin 	return 0;
9684f56d42cSAsias He }
96949a8afd1SSasha Levin virtio_dev_exit(virtio_net__exit);
970