xref: /kvmtool/virtio/net.c (revision 74af1456dfa0c3fb1c79529450c6130b54fd1c83)
131638bcaSCyrill Gorcunov #include "kvm/virtio-pci-dev.h"
2b5ee1ea7SAsias He #include "kvm/virtio-net.h"
34f56d42cSAsias He #include "kvm/virtio.h"
44f56d42cSAsias He #include "kvm/mutex.h"
54f56d42cSAsias He #include "kvm/util.h"
64f56d42cSAsias He #include "kvm/kvm.h"
7b5ee1ea7SAsias He #include "kvm/uip.h"
8cb83de6fSSasha Levin #include "kvm/guest_compat.h"
97668c3a6SSasha Levin #include "kvm/iovec.h"
1005755b29SAndre Przywara #include "kvm/strbuf.h"
114f56d42cSAsias He 
12029cd2bbSJean-Philippe Brucker #include <linux/list.h>
139ed67cdcSSasha Levin #include <linux/vhost.h>
144f56d42cSAsias He #include <linux/virtio_net.h>
154f56d42cSAsias He #include <linux/if_tun.h>
1678a2a3e2SSasha Levin #include <linux/types.h>
17c229370aSIngo Molnar 
18c229370aSIngo Molnar #include <arpa/inet.h>
194f56d42cSAsias He #include <net/if.h>
20c229370aSIngo Molnar 
21c229370aSIngo Molnar #include <unistd.h>
224f56d42cSAsias He #include <fcntl.h>
23c229370aSIngo Molnar 
24cb7202c1SSasha Levin #include <sys/socket.h>
25c229370aSIngo Molnar #include <sys/ioctl.h>
26c229370aSIngo Molnar #include <sys/types.h>
2773b7d038SAmos Kong #include <sys/wait.h>
284f56d42cSAsias He 
/* Size handed to virtio_init_device_vq() for every queue; also bounds the per-thread iovec arrays. */
#define VIRTIO_NET_QUEUE_SIZE		256
/* Maximum number of RX/TX queue pairs; net_dev::queues holds twice this plus one control queue. */
#define VIRTIO_NET_NUM_QUEUES		8
314f56d42cSAsias He 
32b4fdde6dSAsias He struct net_dev;
33b4fdde6dSAsias He 
34b4fdde6dSAsias He struct net_dev_operations {
35b4fdde6dSAsias He 	int (*rx)(struct iovec *iov, u16 in, struct net_dev *ndev);
36b4fdde6dSAsias He 	int (*tx)(struct iovec *iov, u16 in, struct net_dev *ndev);
37b4fdde6dSAsias He };
38b4fdde6dSAsias He 
39ad96e867SJean-Philippe Brucker struct net_dev_queue {
40ad96e867SJean-Philippe Brucker 	int				id;
41ad96e867SJean-Philippe Brucker 	struct net_dev			*ndev;
42ad96e867SJean-Philippe Brucker 	struct virt_queue		vq;
43ad96e867SJean-Philippe Brucker 	pthread_t			thread;
44ad96e867SJean-Philippe Brucker 	struct mutex			lock;
45ad96e867SJean-Philippe Brucker 	pthread_cond_t			cond;
46ad96e867SJean-Philippe Brucker };
47ad96e867SJean-Philippe Brucker 
488626798bSAsias He struct net_dev {
49d3476f7dSSasha Levin 	struct mutex			mutex;
5002eca50cSAsias He 	struct virtio_device		vdev;
519a6d73f1SSasha Levin 	struct list_head		list;
524f56d42cSAsias He 
53ad96e867SJean-Philippe Brucker 	struct net_dev_queue		queues[VIRTIO_NET_NUM_QUEUES * 2 + 1];
54c229370aSIngo Molnar 	struct virtio_net_config	config;
55902a8ecbSJean-Philippe Brucker 	u32				queue_pairs;
56c4aa7c02SPekka Enberg 
579ed67cdcSSasha Levin 	int				vhost_fd;
584f56d42cSAsias He 	int				tap_fd;
594f56d42cSAsias He 	char				tap_name[IFNAMSIZ];
6059ee54ebSWei Chen 	bool				tap_ufo;
61bb1a32f1SAsias He 
62bb1a32f1SAsias He 	int				mode;
63bb1a32f1SAsias He 
64b5ee1ea7SAsias He 	struct uip_info			info;
65b4fdde6dSAsias He 	struct net_dev_operations	*ops;
669a6d73f1SSasha Levin 	struct kvm			*kvm;
678c0ae74dSSasha Levin 
688c0ae74dSSasha Levin 	struct virtio_net_params	*params;
694f56d42cSAsias He };
704f56d42cSAsias He 
/* File-level list head for net devices. */
static LIST_HEAD(ndevs);
/* Handle passed to compat__remove_message() once a queue is initialised. */
static int compat_id = -1;

/* Payload capacity of the RX bounce buffer, excluding the virtio-net header. */
#define MAX_PACKET_SIZE 65550
757668c3a6SSasha Levin 
/*
 * Return true if feature bit @feature is set in the device's negotiated
 * feature mask.
 *
 * The mask is built with a 64-bit constant: shifting a plain int is
 * undefined for bit 31 and cannot address bits 32 and above.
 */
static bool has_virtio_feature(struct net_dev *ndev, u32 feature)
{
	return !!(ndev->vdev.features & (1ULL << feature));
}
807668c3a6SSasha Levin 
virtio_net_hdr_len(struct net_dev * ndev)81b231683cSJean-Philippe Brucker static int virtio_net_hdr_len(struct net_dev *ndev)
82b231683cSJean-Philippe Brucker {
83b231683cSJean-Philippe Brucker 	if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ||
84b231683cSJean-Philippe Brucker 	    !ndev->vdev.legacy)
85b231683cSJean-Philippe Brucker 		return sizeof(struct virtio_net_hdr_mrg_rxbuf);
86b231683cSJean-Philippe Brucker 
87b231683cSJean-Philippe Brucker 	return sizeof(struct virtio_net_hdr);
88b231683cSJean-Philippe Brucker }
89b231683cSJean-Philippe Brucker 
virtio_net_rx_thread(void * p)90c4aa7c02SPekka Enberg static void *virtio_net_rx_thread(void *p)
914f56d42cSAsias He {
924f56d42cSAsias He 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
93ad96e867SJean-Philippe Brucker 	struct net_dev_queue *queue = p;
94ad96e867SJean-Philippe Brucker 	struct virt_queue *vq = &queue->vq;
95ad96e867SJean-Philippe Brucker 	struct net_dev *ndev = queue->ndev;
9643835ac9SSasha Levin 	struct kvm *kvm;
973fdf659dSSasha Levin 	u16 out, in;
983fdf659dSSasha Levin 	u16 head;
996d6cc14bSWill Deacon 	int len, copied;
1004f56d42cSAsias He 
101a4d8c55eSSasha Levin 	kvm__set_thread_name("virtio-net-rx");
102a4d8c55eSSasha Levin 
1039a6d73f1SSasha Levin 	kvm = ndev->kvm;
104c4aa7c02SPekka Enberg 	while (1) {
105ad96e867SJean-Philippe Brucker 		mutex_lock(&queue->lock);
106c4aa7c02SPekka Enberg 		if (!virt_queue__available(vq))
107ad96e867SJean-Philippe Brucker 			pthread_cond_wait(&queue->cond, &queue->lock.mutex);
108ad96e867SJean-Philippe Brucker 		mutex_unlock(&queue->lock);
1094f56d42cSAsias He 
1104f56d42cSAsias He 		while (virt_queue__available(vq)) {
1117668c3a6SSasha Levin 			unsigned char buffer[MAX_PACKET_SIZE + sizeof(struct virtio_net_hdr_mrg_rxbuf)];
1127668c3a6SSasha Levin 			struct iovec dummy_iov = {
1137668c3a6SSasha Levin 				.iov_base = buffer,
1147668c3a6SSasha Levin 				.iov_len  = sizeof(buffer),
1157668c3a6SSasha Levin 			};
1167668c3a6SSasha Levin 			struct virtio_net_hdr_mrg_rxbuf *hdr;
1173fea89a9SWill Deacon 			u16 num_buffers;
1187f5ffaf5SAsias He 
1197668c3a6SSasha Levin 			len = ndev->ops->rx(&dummy_iov, 1, ndev);
1206d6cc14bSWill Deacon 			if (len < 0) {
1216d6cc14bSWill Deacon 				pr_warning("%s: rx on vq %u failed (%d), exiting thread\n",
122ad96e867SJean-Philippe Brucker 						__func__, queue->id, len);
1236d6cc14bSWill Deacon 				goto out_err;
1246d6cc14bSWill Deacon 			}
1256d6cc14bSWill Deacon 
1263fea89a9SWill Deacon 			copied = num_buffers = 0;
1277668c3a6SSasha Levin 			head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1288ed60bbeSMarc Zyngier 			hdr = iov[0].iov_base;
1297668c3a6SSasha Levin 			while (copied < len) {
1306d6cc14bSWill Deacon 				size_t iovsize = min_t(size_t, len - copied, iov_size(iov, in));
1317668c3a6SSasha Levin 
132e2493047SAsias He 				memcpy_toiovec(iov, buffer + copied, iovsize);
1337668c3a6SSasha Levin 				copied += iovsize;
1343fea89a9SWill Deacon 				virt_queue__set_used_elem_no_update(vq, head, iovsize, num_buffers++);
1357668c3a6SSasha Levin 				if (copied == len)
1367668c3a6SSasha Levin 					break;
1377668c3a6SSasha Levin 				while (!virt_queue__available(vq))
1387668c3a6SSasha Levin 					sleep(0);
1397668c3a6SSasha Levin 				head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1407668c3a6SSasha Levin 			}
1413fea89a9SWill Deacon 
142b231683cSJean-Philippe Brucker 			/*
143b231683cSJean-Philippe Brucker 			 * The device MUST set num_buffers, except in the case
144b231683cSJean-Philippe Brucker 			 * where the legacy driver did not negotiate
145b231683cSJean-Philippe Brucker 			 * VIRTIO_NET_F_MRG_RXBUF and the field does not exist.
146b231683cSJean-Philippe Brucker 			 */
147b231683cSJean-Philippe Brucker 			if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ||
148b231683cSJean-Philippe Brucker 			    !ndev->vdev.legacy)
149b17552eeSAndre Przywara 				hdr->num_buffers = virtio_host_to_guest_u16(vq->endian, num_buffers);
1503fea89a9SWill Deacon 
1513fea89a9SWill Deacon 			virt_queue__used_idx_advance(vq, num_buffers);
1523fea89a9SWill Deacon 
153c4aa7c02SPekka Enberg 			/* We should interrupt guest right now, otherwise latency is huge. */
1546585ffb7SSasha Levin 			if (virtio_queue__should_signal(vq))
155ad96e867SJean-Philippe Brucker 				ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id);
1564f56d42cSAsias He 		}
157c4aa7c02SPekka Enberg 	}
158c4aa7c02SPekka Enberg 
1596d6cc14bSWill Deacon out_err:
160c4aa7c02SPekka Enberg 	pthread_exit(NULL);
161c4aa7c02SPekka Enberg 	return NULL;
162c4aa7c02SPekka Enberg 
163c4aa7c02SPekka Enberg }
164c4aa7c02SPekka Enberg 
virtio_net_tx_thread(void * p)165c4aa7c02SPekka Enberg static void *virtio_net_tx_thread(void *p)
1664f56d42cSAsias He {
1674f56d42cSAsias He 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
168ad96e867SJean-Philippe Brucker 	struct net_dev_queue *queue = p;
169ad96e867SJean-Philippe Brucker 	struct virt_queue *vq = &queue->vq;
170ad96e867SJean-Philippe Brucker 	struct net_dev *ndev = queue->ndev;
17143835ac9SSasha Levin 	struct kvm *kvm;
1723fdf659dSSasha Levin 	u16 out, in;
1733fdf659dSSasha Levin 	u16 head;
1744f56d42cSAsias He 	int len;
1754f56d42cSAsias He 
176a4d8c55eSSasha Levin 	kvm__set_thread_name("virtio-net-tx");
177a4d8c55eSSasha Levin 
1789a6d73f1SSasha Levin 	kvm = ndev->kvm;
179c4aa7c02SPekka Enberg 
180c4aa7c02SPekka Enberg 	while (1) {
181ad96e867SJean-Philippe Brucker 		mutex_lock(&queue->lock);
182c4aa7c02SPekka Enberg 		if (!virt_queue__available(vq))
183ad96e867SJean-Philippe Brucker 			pthread_cond_wait(&queue->cond, &queue->lock.mutex);
184ad96e867SJean-Philippe Brucker 		mutex_unlock(&queue->lock);
1854f56d42cSAsias He 
1864f56d42cSAsias He 		while (virt_queue__available(vq)) {
18743835ac9SSasha Levin 			head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1889a6d73f1SSasha Levin 			len = ndev->ops->tx(iov, out, ndev);
1896d6cc14bSWill Deacon 			if (len < 0) {
1906d6cc14bSWill Deacon 				pr_warning("%s: tx on vq %u failed (%d)\n",
191ad96e867SJean-Philippe Brucker 						__func__, queue->id, errno);
1926d6cc14bSWill Deacon 				goto out_err;
1936d6cc14bSWill Deacon 			}
1946d6cc14bSWill Deacon 
1954f56d42cSAsias He 			virt_queue__set_used_elem(vq, head, len);
1964f56d42cSAsias He 		}
1974f56d42cSAsias He 
1986585ffb7SSasha Levin 		if (virtio_queue__should_signal(vq))
199ad96e867SJean-Philippe Brucker 			ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id);
2004f56d42cSAsias He 	}
2014f56d42cSAsias He 
2026d6cc14bSWill Deacon out_err:
203c4aa7c02SPekka Enberg 	pthread_exit(NULL);
204c4aa7c02SPekka Enberg 	return NULL;
205c4aa7c02SPekka Enberg }
206407475bfSPekka Enberg 
virtio_net_handle_mq(struct kvm * kvm,struct net_dev * ndev,struct virtio_net_ctrl_hdr * ctrl)2076585ffb7SSasha Levin static virtio_net_ctrl_ack virtio_net_handle_mq(struct kvm* kvm, struct net_dev *ndev, struct virtio_net_ctrl_hdr *ctrl)
2086585ffb7SSasha Levin {
2096585ffb7SSasha Levin 	/* Not much to do here */
2106585ffb7SSasha Levin 	return VIRTIO_NET_OK;
2116585ffb7SSasha Levin }
2126585ffb7SSasha Levin 
virtio_net_ctrl_thread(void * p)2136585ffb7SSasha Levin static void *virtio_net_ctrl_thread(void *p)
214abd4a801SSasha Levin {
215abd4a801SSasha Levin 	struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
216ad96e867SJean-Philippe Brucker 	struct net_dev_queue *queue = p;
217ad96e867SJean-Philippe Brucker 	struct virt_queue *vq = &queue->vq;
218ad96e867SJean-Philippe Brucker 	struct net_dev *ndev = queue->ndev;
219abd4a801SSasha Levin 	u16 out, in, head;
2206585ffb7SSasha Levin 	struct kvm *kvm = ndev->kvm;
2216daffe57SJean-Philippe Brucker 	struct virtio_net_ctrl_hdr ctrl;
2226daffe57SJean-Philippe Brucker 	virtio_net_ctrl_ack ack;
2236daffe57SJean-Philippe Brucker 	size_t len;
224abd4a801SSasha Levin 
225edb4a8a0SSuzuki K. Poulose 	kvm__set_thread_name("virtio-net-ctrl");
226edb4a8a0SSuzuki K. Poulose 
2276585ffb7SSasha Levin 	while (1) {
228ad96e867SJean-Philippe Brucker 		mutex_lock(&queue->lock);
2296585ffb7SSasha Levin 		if (!virt_queue__available(vq))
230ad96e867SJean-Philippe Brucker 			pthread_cond_wait(&queue->cond, &queue->lock.mutex);
231ad96e867SJean-Philippe Brucker 		mutex_unlock(&queue->lock);
2326585ffb7SSasha Levin 
2336585ffb7SSasha Levin 		while (virt_queue__available(vq)) {
234ad96e867SJean-Philippe Brucker 			head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
2356daffe57SJean-Philippe Brucker 			len = min(iov_size(iov, in), sizeof(ctrl));
2366daffe57SJean-Philippe Brucker 			memcpy_fromiovec((void *)&ctrl, iov, len);
237abd4a801SSasha Levin 
2386daffe57SJean-Philippe Brucker 			switch (ctrl.class) {
2396585ffb7SSasha Levin 			case VIRTIO_NET_CTRL_MQ:
2406daffe57SJean-Philippe Brucker 				ack = virtio_net_handle_mq(kvm, ndev, &ctrl);
2416585ffb7SSasha Levin 				break;
242abd4a801SSasha Levin 			default:
2436daffe57SJean-Philippe Brucker 				ack = VIRTIO_NET_ERR;
244abd4a801SSasha Levin 				break;
245abd4a801SSasha Levin 			}
2466daffe57SJean-Philippe Brucker 			memcpy_toiovec(iov + in, &ack, sizeof(ack));
2476daffe57SJean-Philippe Brucker 			virt_queue__set_used_elem(vq, head, sizeof(ack));
2486585ffb7SSasha Levin 		}
249abd4a801SSasha Levin 
250ad96e867SJean-Philippe Brucker 		if (virtio_queue__should_signal(vq))
251ad96e867SJean-Philippe Brucker 			ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id);
2526585ffb7SSasha Levin 	}
253abd4a801SSasha Levin 
2546585ffb7SSasha Levin 	pthread_exit(NULL);
255abd4a801SSasha Levin 
2566585ffb7SSasha Levin 	return NULL;
257abd4a801SSasha Levin }
258abd4a801SSasha Levin 
virtio_net_handle_callback(struct kvm * kvm,struct net_dev * ndev,int queue)2599a6d73f1SSasha Levin static void virtio_net_handle_callback(struct kvm *kvm, struct net_dev *ndev, int queue)
2604f56d42cSAsias He {
261ad96e867SJean-Philippe Brucker 	struct net_dev_queue *net_queue = &ndev->queues[queue];
262ad96e867SJean-Philippe Brucker 
26379052597SSasha Levin 	if ((u32)queue >= (ndev->queue_pairs * 2 + 1)) {
2649a6d73f1SSasha Levin 		pr_warning("Unknown queue index %u", queue);
2656585ffb7SSasha Levin 		return;
266c4aa7c02SPekka Enberg 	}
2676585ffb7SSasha Levin 
268ad96e867SJean-Philippe Brucker 	mutex_lock(&net_queue->lock);
269ad96e867SJean-Philippe Brucker 	pthread_cond_signal(&net_queue->cond);
270ad96e867SJean-Philippe Brucker 	mutex_unlock(&net_queue->lock);
2714f56d42cSAsias He }
2724f56d42cSAsias He 
virtio_net_request_tap(struct net_dev * ndev,struct ifreq * ifr,const char * tapname)273d2a7ddffSMarc Zyngier static int virtio_net_request_tap(struct net_dev *ndev, struct ifreq *ifr,
274d2a7ddffSMarc Zyngier 				  const char *tapname)
275d2a7ddffSMarc Zyngier {
276d2a7ddffSMarc Zyngier 	int ret;
277d2a7ddffSMarc Zyngier 
278d2a7ddffSMarc Zyngier 	memset(ifr, 0, sizeof(*ifr));
279d2a7ddffSMarc Zyngier 	ifr->ifr_flags = IFF_TAP | IFF_NO_PI | IFF_VNET_HDR;
280d2a7ddffSMarc Zyngier 	if (tapname)
28105755b29SAndre Przywara 		strlcpy(ifr->ifr_name, tapname, sizeof(ifr->ifr_name));
282d2a7ddffSMarc Zyngier 
283f83dc816SAndreas Herrmann 	ret = ioctl(ndev->tap_fd, TUNSETIFF, ifr);
284d2a7ddffSMarc Zyngier 
285d2a7ddffSMarc Zyngier 	if (ret >= 0)
28605755b29SAndre Przywara 		strlcpy(ndev->tap_name, ifr->ifr_name, sizeof(ndev->tap_name));
287d2a7ddffSMarc Zyngier 	return ret;
288d2a7ddffSMarc Zyngier }
289d2a7ddffSMarc Zyngier 
/*
 * Run @script with @tap_name as its only argument and wait for it to finish.
 *
 * Returns 0 if the script exited with status 0. Returns -1 if the child
 * could not be created or waited for, if it exited with a non-zero status,
 * or if it did not exit normally.
 */
static int virtio_net_exec_script(const char* script, const char *tap_name)
{
	pid_t pid;
	int status;

	pid = vfork();
	if (pid < 0) {
		pr_warning("Fail to setup tap by %s", script);
		return -1;
	}

	if (pid == 0) {
		/* The variadic sentinel must be a null char pointer. */
		execl(script, script, tap_name, (char *)NULL);
		/* Only reached if exec failed. */
		_exit(1);
	}

	/* Retry if interrupted so 'status' is always valid below. */
	while (waitpid(pid, &status, 0) < 0) {
		if (errno != EINTR) {
			pr_warning("Fail to setup tap by %s", script);
			return -1;
		}
	}

	if (!WIFEXITED(status) || WEXITSTATUS(status) != 0) {
		pr_warning("Fail to setup tap by %s", script);
		return -1;
	}

	return 0;
}
308eef27ae3SFan Du 
virtio_net__tap_init(struct net_dev * ndev)3098c0ae74dSSasha Levin static bool virtio_net__tap_init(struct net_dev *ndev)
3104f56d42cSAsias He {
311cb7202c1SSasha Levin 	int sock = socket(AF_INET, SOCK_STREAM, 0);
31259ee54ebSWei Chen 	int hdr_len;
313cb7202c1SSasha Levin 	struct sockaddr_in sin = {0};
314246c8347SAsias He 	struct ifreq ifr;
3158c0ae74dSSasha Levin 	const struct virtio_net_params *params = ndev->params;
3161dfc7c24SMarc Zyngier 	bool skipconf = !!params->tapif;
3174f56d42cSAsias He 
318b231683cSJean-Philippe Brucker 	hdr_len = virtio_net_hdr_len(ndev);
3199a6d73f1SSasha Levin 	if (ioctl(ndev->tap_fd, TUNSETVNETHDRSZ, &hdr_len) < 0)
3204542f276SCyrill Gorcunov 		pr_warning("Config tap device TUNSETVNETHDRSZ error");
321246c8347SAsias He 
32273b7d038SAmos Kong 	if (strcmp(params->script, "none")) {
323eef27ae3SFan Du 		if (virtio_net_exec_script(params->script, ndev->tap_name) < 0)
32473b7d038SAmos Kong 			goto fail;
3251dfc7c24SMarc Zyngier 	} else if (!skipconf) {
326cb7202c1SSasha Levin 		memset(&ifr, 0, sizeof(ifr));
32716509081SAnisse Astier 		strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name));
328bdfcfca6SSasha Levin 		sin.sin_addr.s_addr = inet_addr(params->host_ip);
329cb7202c1SSasha Levin 		memcpy(&(ifr.ifr_addr), &sin, sizeof(ifr.ifr_addr));
330cb7202c1SSasha Levin 		ifr.ifr_addr.sa_family = AF_INET;
3313b02f580SSasha Levin 		if (ioctl(sock, SIOCSIFADDR, &ifr) < 0) {
3324542f276SCyrill Gorcunov 			pr_warning("Could not set ip address on tap device");
3333b02f580SSasha Levin 			goto fail;
3343b02f580SSasha Levin 		}
33573b7d038SAmos Kong 	}
336cb7202c1SSasha Levin 
3371dfc7c24SMarc Zyngier 	if (!skipconf) {
338cb7202c1SSasha Levin 		memset(&ifr, 0, sizeof(ifr));
33916509081SAnisse Astier 		strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name));
340cb7202c1SSasha Levin 		ioctl(sock, SIOCGIFFLAGS, &ifr);
341cb7202c1SSasha Levin 		ifr.ifr_flags |= IFF_UP | IFF_RUNNING;
342cb7202c1SSasha Levin 		if (ioctl(sock, SIOCSIFFLAGS, &ifr) < 0)
3434542f276SCyrill Gorcunov 			pr_warning("Could not bring tap device up");
3441dfc7c24SMarc Zyngier 	}
345cb7202c1SSasha Levin 
346cb7202c1SSasha Levin 	close(sock);
3473b02f580SSasha Levin 
3483b02f580SSasha Levin 	return 1;
3493b02f580SSasha Levin 
3503b02f580SSasha Levin fail:
3513b02f580SSasha Levin 	if (sock >= 0)
3523b02f580SSasha Levin 		close(sock);
3539a6d73f1SSasha Levin 	if (ndev->tap_fd >= 0)
3549a6d73f1SSasha Levin 		close(ndev->tap_fd);
3553b02f580SSasha Levin 
3563b02f580SSasha Levin 	return 0;
3574f56d42cSAsias He }
3584f56d42cSAsias He 
virtio_net__tap_exit(struct net_dev * ndev)35949bada43SJean-Philippe Brucker static void virtio_net__tap_exit(struct net_dev *ndev)
36049bada43SJean-Philippe Brucker {
36149bada43SJean-Philippe Brucker 	int sock;
36249bada43SJean-Philippe Brucker 	struct ifreq ifr;
36349bada43SJean-Philippe Brucker 
36449bada43SJean-Philippe Brucker 	if (ndev->params->tapif)
36549bada43SJean-Philippe Brucker 		return;
36649bada43SJean-Philippe Brucker 
36749bada43SJean-Philippe Brucker 	sock = socket(AF_INET, SOCK_STREAM, 0);
36816509081SAnisse Astier 	strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name));
36949bada43SJean-Philippe Brucker 	ioctl(sock, SIOCGIFFLAGS, &ifr);
37049bada43SJean-Philippe Brucker 	ifr.ifr_flags &= ~(IFF_UP | IFF_RUNNING);
37149bada43SJean-Philippe Brucker 	if (ioctl(sock, SIOCGIFFLAGS, &ifr) < 0)
37249bada43SJean-Philippe Brucker 		pr_warning("Count not bring tap device down");
37349bada43SJean-Philippe Brucker 	close(sock);
37449bada43SJean-Philippe Brucker }
37549bada43SJean-Philippe Brucker 
virtio_net__tap_create(struct net_dev * ndev)37659ee54ebSWei Chen static bool virtio_net__tap_create(struct net_dev *ndev)
37759ee54ebSWei Chen {
37859ee54ebSWei Chen 	int offload;
37959ee54ebSWei Chen 	struct ifreq ifr;
38059ee54ebSWei Chen 	const struct virtio_net_params *params = ndev->params;
38159ee54ebSWei Chen 	bool macvtap = (!!params->tapif) && (params->tapif[0] == '/');
38259ee54ebSWei Chen 
38359ee54ebSWei Chen 	/* Did the user already gave us the FD? */
38459ee54ebSWei Chen 	if (params->fd)
38559ee54ebSWei Chen 		ndev->tap_fd = params->fd;
38659ee54ebSWei Chen 	else {
38759ee54ebSWei Chen 		const char *tap_file = "/dev/net/tun";
38859ee54ebSWei Chen 
38959ee54ebSWei Chen 		/* Did the user ask us to use macvtap? */
39059ee54ebSWei Chen 		if (macvtap)
39159ee54ebSWei Chen 			tap_file = params->tapif;
39259ee54ebSWei Chen 
39359ee54ebSWei Chen 		ndev->tap_fd = open(tap_file, O_RDWR);
39459ee54ebSWei Chen 		if (ndev->tap_fd < 0) {
39559ee54ebSWei Chen 			pr_warning("Unable to open %s", tap_file);
39659ee54ebSWei Chen 			return 0;
39759ee54ebSWei Chen 		}
39859ee54ebSWei Chen 	}
39959ee54ebSWei Chen 
40059ee54ebSWei Chen 	if (!macvtap &&
40159ee54ebSWei Chen 	    virtio_net_request_tap(ndev, &ifr, params->tapif) < 0) {
40259ee54ebSWei Chen 		pr_warning("Config tap device error. Are you root?");
40359ee54ebSWei Chen 		goto fail;
40459ee54ebSWei Chen 	}
40559ee54ebSWei Chen 
40659ee54ebSWei Chen 	/*
40759ee54ebSWei Chen 	 * The UFO support had been removed from kernel in commit:
40859ee54ebSWei Chen 	 * ID: fb652fdfe83710da0ca13448a41b7ed027d0a984
40959ee54ebSWei Chen 	 * https://www.spinics.net/lists/netdev/msg443562.html
41059ee54ebSWei Chen 	 * In oder to support the older kernels without this commit,
41159ee54ebSWei Chen 	 * we set the TUN_F_UFO to offload by default to test the status of
41259ee54ebSWei Chen 	 * UFO kernel support.
41359ee54ebSWei Chen 	 */
41459ee54ebSWei Chen 	ndev->tap_ufo = true;
41559ee54ebSWei Chen 	offload = TUN_F_CSUM | TUN_F_TSO4 | TUN_F_TSO6 | TUN_F_UFO;
41659ee54ebSWei Chen 	if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) {
41759ee54ebSWei Chen 		/*
41859ee54ebSWei Chen 		 * Is this failure caused by kernel remove the UFO support?
41959ee54ebSWei Chen 		 * Try TUNSETOFFLOAD without TUN_F_UFO.
42059ee54ebSWei Chen 		 */
42159ee54ebSWei Chen 		offload &= ~TUN_F_UFO;
42259ee54ebSWei Chen 		if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) {
42359ee54ebSWei Chen 			pr_warning("Config tap device TUNSETOFFLOAD error");
42459ee54ebSWei Chen 			goto fail;
42559ee54ebSWei Chen 		}
42659ee54ebSWei Chen 		ndev->tap_ufo = false;
42759ee54ebSWei Chen 	}
42859ee54ebSWei Chen 
42959ee54ebSWei Chen 	return 1;
43059ee54ebSWei Chen 
43159ee54ebSWei Chen fail:
43259ee54ebSWei Chen 	if ((ndev->tap_fd >= 0) || (!params->fd) )
43359ee54ebSWei Chen 		close(ndev->tap_fd);
43459ee54ebSWei Chen 
43559ee54ebSWei Chen 	return 0;
43659ee54ebSWei Chen }
43759ee54ebSWei Chen 
/* TAP backend transmit hook: write the first @out entries of @iov to the TAP fd. */
static inline int tap_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev)
{
	int fd = ndev->tap_fd;

	return writev(fd, iov, out);
}
442b4fdde6dSAsias He 
/* TAP backend receive hook: read from the TAP fd into the first @in entries of @iov. */
static inline int tap_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev)
{
	int fd = ndev->tap_fd;

	return readv(fd, iov, in);
}
447b4fdde6dSAsias He 
/* uip backend transmit hook: forward to uip_tx() with this device's uip state. */
static inline int uip_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev)
{
	struct uip_info *uip = &ndev->info;

	return uip_tx(iov, out, uip);
}
452b4fdde6dSAsias He 
/* uip backend receive hook: forward to uip_rx() with this device's uip state. */
static inline int uip_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev)
{
	struct uip_info *uip = &ndev->info;

	return uip_rx(iov, in, uip);
}
457b4fdde6dSAsias He 
458b4fdde6dSAsias He static struct net_dev_operations tap_ops = {
459b4fdde6dSAsias He 	.rx	= tap_ops_rx,
460b4fdde6dSAsias He 	.tx	= tap_ops_tx,
461b4fdde6dSAsias He };
462b4fdde6dSAsias He 
463b4fdde6dSAsias He static struct net_dev_operations uip_ops = {
464b4fdde6dSAsias He 	.rx	= uip_ops_rx,
465b4fdde6dSAsias He 	.tx	= uip_ops_tx,
466b4fdde6dSAsias He };
467b4fdde6dSAsias He 
get_config(struct kvm * kvm,void * dev)468c5ae742bSSasha Levin static u8 *get_config(struct kvm *kvm, void *dev)
46978a2a3e2SSasha Levin {
47078a2a3e2SSasha Levin 	struct net_dev *ndev = dev;
47178a2a3e2SSasha Levin 
472c5ae742bSSasha Levin 	return ((u8 *)(&ndev->config));
47378a2a3e2SSasha Levin }
47478a2a3e2SSasha Levin 
get_config_size(struct kvm * kvm,void * dev)475e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev)
476e4730284SMartin Radev {
477e4730284SMartin Radev 	struct net_dev *ndev = dev;
478e4730284SMartin Radev 
479e4730284SMartin Radev 	return sizeof(ndev->config);
480e4730284SMartin Radev }
481e4730284SMartin Radev 
get_host_features(struct kvm * kvm,void * dev)4823c8f82b8SJean-Philippe Brucker static u64 get_host_features(struct kvm *kvm, void *dev)
48378a2a3e2SSasha Levin {
4843c8f82b8SJean-Philippe Brucker 	u64 features;
48579052597SSasha Levin 	struct net_dev *ndev = dev;
48679052597SSasha Levin 
48759ee54ebSWei Chen 	features = 1UL << VIRTIO_NET_F_MAC
48878a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_CSUM
48978a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_HOST_TSO4
49078a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_HOST_TSO6
49178a2a3e2SSasha Levin 		| 1UL << VIRTIO_NET_F_GUEST_TSO4
49292c1f37bSSasha Levin 		| 1UL << VIRTIO_NET_F_GUEST_TSO6
493754c8ce3SSasha Levin 		| 1UL << VIRTIO_RING_F_EVENT_IDX
494abd4a801SSasha Levin 		| 1UL << VIRTIO_RING_F_INDIRECT_DESC
4956585ffb7SSasha Levin 		| 1UL << VIRTIO_NET_F_CTRL_VQ
4967668c3a6SSasha Levin 		| 1UL << VIRTIO_NET_F_MRG_RXBUF
4976daffe57SJean-Philippe Brucker 		| 1UL << (ndev->queue_pairs > 1 ? VIRTIO_NET_F_MQ : 0)
4986daffe57SJean-Philippe Brucker 		| 1UL << VIRTIO_F_ANY_LAYOUT;
49959ee54ebSWei Chen 
50059ee54ebSWei Chen 	/*
50159ee54ebSWei Chen 	 * The UFO feature for host and guest only can be enabled when the
50259ee54ebSWei Chen 	 * kernel has TAP UFO support.
50359ee54ebSWei Chen 	 */
50459ee54ebSWei Chen 	if (ndev->tap_ufo)
50559ee54ebSWei Chen 		features |= (1UL << VIRTIO_NET_F_HOST_UFO
50659ee54ebSWei Chen 				| 1UL << VIRTIO_NET_F_GUEST_UFO);
50759ee54ebSWei Chen 
50853171d59SJean-Philippe Brucker 	if (ndev->vhost_fd) {
50915636d5eSYing-Shiuan Pan 		u64 vhost_features;
51015636d5eSYing-Shiuan Pan 
51115636d5eSYing-Shiuan Pan 		if (ioctl(ndev->vhost_fd, VHOST_GET_FEATURES, &vhost_features) != 0)
51215636d5eSYing-Shiuan Pan 			die_perror("VHOST_GET_FEATURES failed");
51315636d5eSYing-Shiuan Pan 
51453171d59SJean-Philippe Brucker 		features &= vhost_features;
51553171d59SJean-Philippe Brucker 	}
51653171d59SJean-Philippe Brucker 
51753171d59SJean-Philippe Brucker 	return features;
51853171d59SJean-Philippe Brucker }
51953171d59SJean-Philippe Brucker 
virtio_net_start(struct net_dev * ndev)52095242e44SJean-Philippe Brucker static void virtio_net_start(struct net_dev *ndev)
52195242e44SJean-Philippe Brucker {
5223b1cdcf9SJean-Philippe Brucker 	/* VHOST_NET_F_VIRTIO_NET_HDR clashes with VIRTIO_F_ANY_LAYOUT! */
5233b1cdcf9SJean-Philippe Brucker 	u64 features = ndev->vdev.features & ~(1UL << VHOST_NET_F_VIRTIO_NET_HDR);
5243b1cdcf9SJean-Philippe Brucker 
5258aa155c4SYing-Shiuan Pan 	if (ndev->mode == NET_MODE_TAP) {
5268aa155c4SYing-Shiuan Pan 		if (!virtio_net__tap_init(ndev))
52759ee54ebSWei Chen 			die_perror("TAP device initialized failed because");
52859ee54ebSWei Chen 
5293b1cdcf9SJean-Philippe Brucker 		if (ndev->vhost_fd && virtio_vhost_set_features(ndev->vhost_fd,
5303b1cdcf9SJean-Philippe Brucker 								features))
53115636d5eSYing-Shiuan Pan 			die_perror("VHOST_SET_FEATURES failed");
5328aa155c4SYing-Shiuan Pan 	} else {
533b231683cSJean-Philippe Brucker 		ndev->info.vnet_hdr_len = virtio_net_hdr_len(ndev);
5348aa155c4SYing-Shiuan Pan 		uip_init(&ndev->info);
5358aa155c4SYing-Shiuan Pan 	}
53678a2a3e2SSasha Levin }
53778a2a3e2SSasha Levin 
virtio_net_stop(struct net_dev * ndev)53849bada43SJean-Philippe Brucker static void virtio_net_stop(struct net_dev *ndev)
53949bada43SJean-Philippe Brucker {
54049bada43SJean-Philippe Brucker 	/* Undo whatever start() did */
54149bada43SJean-Philippe Brucker 	if (ndev->mode == NET_MODE_TAP)
54249bada43SJean-Philippe Brucker 		virtio_net__tap_exit(ndev);
54349bada43SJean-Philippe Brucker 	else
54449bada43SJean-Philippe Brucker 		uip_exit(&ndev->info);
54549bada43SJean-Philippe Brucker }
54649bada43SJean-Philippe Brucker 
virtio_net_update_endian(struct net_dev * ndev)547867b15ccSJean-Philippe Brucker static void virtio_net_update_endian(struct net_dev *ndev)
548867b15ccSJean-Philippe Brucker {
549867b15ccSJean-Philippe Brucker 	struct virtio_net_config *conf = &ndev->config;
550867b15ccSJean-Philippe Brucker 
551b17552eeSAndre Przywara 	conf->status = virtio_host_to_guest_u16(ndev->vdev.endian,
552867b15ccSJean-Philippe Brucker 						VIRTIO_NET_S_LINK_UP);
553b17552eeSAndre Przywara 	conf->max_virtqueue_pairs = virtio_host_to_guest_u16(ndev->vdev.endian,
554867b15ccSJean-Philippe Brucker 							     ndev->queue_pairs);
5558b27bcffSJean-Philippe Brucker 
5568b27bcffSJean-Philippe Brucker 	/* Let TAP know about vnet header endianness */
5578b27bcffSJean-Philippe Brucker 	if (ndev->mode == NET_MODE_TAP &&
5588b27bcffSJean-Philippe Brucker 	    ndev->vdev.endian != VIRTIO_ENDIAN_HOST) {
5598b27bcffSJean-Philippe Brucker 		int enable_val = 1, disable_val = 0;
5608b27bcffSJean-Philippe Brucker 		int enable_req, disable_req;
5618b27bcffSJean-Philippe Brucker 
5628b27bcffSJean-Philippe Brucker 		if (ndev->vdev.endian == VIRTIO_ENDIAN_LE) {
5638b27bcffSJean-Philippe Brucker 			enable_req = TUNSETVNETLE;
5648b27bcffSJean-Philippe Brucker 			disable_req = TUNSETVNETBE;
5658b27bcffSJean-Philippe Brucker 		} else {
5668b27bcffSJean-Philippe Brucker 			enable_req = TUNSETVNETBE;
5678b27bcffSJean-Philippe Brucker 			disable_req = TUNSETVNETLE;
5688b27bcffSJean-Philippe Brucker 		}
5698b27bcffSJean-Philippe Brucker 
5708b27bcffSJean-Philippe Brucker 		ioctl(ndev->tap_fd, disable_req, &disable_val);
5718b27bcffSJean-Philippe Brucker 		if (ioctl(ndev->tap_fd, enable_req, &enable_val) < 0)
5728b27bcffSJean-Philippe Brucker 			pr_err("Config tap device TUNSETVNETLE/BE error");
5738b27bcffSJean-Philippe Brucker 	}
574867b15ccSJean-Philippe Brucker }
575867b15ccSJean-Philippe Brucker 
/*
 * React to a device status change.
 *
 * VIRTIO__STATUS_CONFIG refreshes the endian-dependent config. After that,
 * START takes precedence over STOP when both bits are set.
 */
static void notify_status(struct kvm *kvm, void *dev, u32 status)
{
	struct net_dev *ndev = dev;

	if (status & VIRTIO__STATUS_CONFIG)
		virtio_net_update_endian(ndev);

	if (status & VIRTIO__STATUS_START) {
		virtio_net_start(ndev);
		return;
	}

	if (status & VIRTIO__STATUS_STOP)
		virtio_net_stop(ndev);
}
58895242e44SJean-Philippe Brucker 
/* The control queue is the one right after all RX/TX pairs. */
static bool is_ctrl_vq(struct net_dev *ndev, u32 vq)
{
	u32 ctrl_index = (u32)(ndev->queue_pairs * 2);

	return vq == ctrl_index;
}
5939e56ec14SSasha Levin 
/*
 * Set up virtqueue @vq and start whatever services it.
 *
 * The control queue always gets a ctrl worker thread. Without vhost
 * (vhost_fd == 0), odd queues get a TX thread and even queues an RX thread.
 * With vhost, the ring is handed to vhost and the TAP fd is set as its
 * backend; failure of that ioctl is fatal.
 *
 * Returns 0 on success, -EINVAL for an out-of-range @vq, or the negated
 * pthread_create() error code if the worker thread could not be started.
 */
static int init_vq(struct kvm *kvm, void *dev, u32 vq)
{
	struct vhost_vring_file file = { .index = vq };
	struct net_dev_queue *net_queue;
	struct net_dev *ndev = dev;
	struct virt_queue *queue;
	void *(*worker)(void *) = NULL;
	int r;

	compat__remove_message(compat_id);

	/* Never index past the fixed-size queue array. */
	if (vq >= sizeof(ndev->queues) / sizeof(ndev->queues[0]))
		return -EINVAL;

	net_queue	= &ndev->queues[vq];
	net_queue->id	= vq;
	net_queue->ndev	= ndev;
	queue		= &net_queue->vq;
	virtio_init_device_vq(kvm, &ndev->vdev, queue, VIRTIO_NET_QUEUE_SIZE);

	mutex_init(&net_queue->lock);
	pthread_cond_init(&net_queue->cond, NULL);

	if (is_ctrl_vq(ndev, vq))
		worker = virtio_net_ctrl_thread;
	else if (ndev->vhost_fd == 0)
		worker = (vq & 1) ? virtio_net_tx_thread : virtio_net_rx_thread;

	if (worker) {
		/* pthread_create() returns a positive error number on failure. */
		r = pthread_create(&net_queue->thread, NULL, worker, net_queue);
		if (r) {
			pr_warning("Failed to create thread for vq %u (%d)", vq, r);
			return -r;
		}

		return 0;
	}

	virtio_vhost_set_vring(kvm, ndev->vhost_fd, vq, queue);

	file.fd = ndev->tap_fd;
	r = ioctl(ndev->vhost_fd, VHOST_NET_SET_BACKEND, &file);
	if (r < 0)
		die_perror("VHOST_NET_SET_BACKEND failed");

	return 0;
}
6379ed67cdcSSasha Levin 
/*
 * Tear down virtqueue @vq of the net device @dev.
 *
 * The vring is always passed to virtio_vhost_reset_vring(). Queues served by
 * a worker thread then have that thread cancelled and joined; vhost data
 * queues only get a VHOST_RESET_OWNER request and a warning.
 */
static void exit_vq(struct kvm *kvm, void *dev, u32 vq)
{
	struct net_dev *ndev = dev;
	struct net_dev_queue *net_queue = &ndev->queues[vq];
	bool vhost_data_queue;

	virtio_vhost_reset_vring(kvm, ndev->vhost_fd, vq, &net_queue->vq);

	vhost_data_queue = ndev->vhost_fd && !is_ctrl_vq(ndev, vq);
	if (!vhost_data_queue) {
		/*
		 * The worker blocks on a cancellation point (readv or
		 * pthread_cond_wait), so cancelling it should stop it
		 * gracefully.
		 */
		pthread_cancel(net_queue->thread);
		pthread_join(net_queue->thread, NULL);
		return;
	}

	/*
	 * TODO: vhost reset owner. It is the only way to cleanly stop vhost,
	 * but we cannot restart it at the moment.
	 */
	pr_warning("Cannot reset VHOST queue");
	ioctl(ndev->vhost_fd, VHOST_RESET_OWNER);
}
66249bada43SJean-Philippe Brucker 
/*
 * Wire interrupt @gsi to virtqueue @vq through an irqfd. Only applies to
 * vhost data queues; does nothing without vhost or for the control queue.
 */
static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi)
{
	struct net_dev *ndev = dev;

	if (ndev->vhost_fd != 0 && !is_ctrl_vq(ndev, vq))
		virtio_vhost_set_vring_irqfd(kvm, gsi, &ndev->queues[vq].vq);
}
6739ed67cdcSSasha Levin 
/*
 * Register eventfd @efd as the kick notifier of virtqueue @vq with vhost.
 * Does nothing without vhost or for the control queue.
 */
static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd)
{
	struct net_dev *ndev = dev;

	if (ndev->vhost_fd != 0 && !is_ctrl_vq(ndev, vq))
		virtio_vhost_set_vring_kick(kvm, ndev->vhost_fd, vq, efd);
}
68378a2a3e2SSasha Levin 
/*
 * Queue notification callback: forwards the notification for @vq to
 * virtio_net_handle_callback(). Always returns 0.
 */
static int notify_vq(struct kvm *kvm, void *dev, u32 vq)
{
	struct net_dev *net = dev;

	virtio_net_handle_callback(kvm, net, vq);
	return 0;
}
69278a2a3e2SSasha Levin 
/* Return the virt_queue embedded in queue slot @vq of the net device @dev. */
static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq)
{
	struct net_dev *ndev = dev;
	struct net_dev_queue *net_queue = &ndev->queues[vq];

	return &net_queue->vq;
}
69978a2a3e2SSasha Levin 
/*
 * Report the size of virtqueue @vq. Every queue currently has the same
 * fixed size, VIRTIO_NET_QUEUE_SIZE.
 */
static int get_size_vq(struct kvm *kvm, void *dev, u32 vq)
{
	/* FIXME: dynamic */
	const int queue_size = VIRTIO_NET_QUEUE_SIZE;

	return queue_size;
}
70578a2a3e2SSasha Levin 
/*
 * Accept a queue size request for @vq. Nothing is stored: the requested
 * @size is simply returned unchanged.
 */
static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size)
{
	/* FIXME: dynamic */
	const int accepted = size;

	return accepted;
}
7110f4f51a8SAsias He 
get_vq_count(struct kvm * kvm,void * dev)71231e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev)
713b98ac591SJean-Philippe Brucker {
714b98ac591SJean-Philippe Brucker 	struct net_dev *ndev = dev;
715b98ac591SJean-Philippe Brucker 
716b98ac591SJean-Philippe Brucker 	return ndev->queue_pairs * 2 + 1;
717b98ac591SJean-Philippe Brucker }
718b98ac591SJean-Philippe Brucker 
71915542babSAndre Przywara static struct virtio_ops net_dev_virtio_ops = {
7201c47ce69SSasha Levin 	.get_config		= get_config,
721e4730284SMartin Radev 	.get_config_size	= get_config_size,
7221c47ce69SSasha Levin 	.get_host_features	= get_host_features,
723b98ac591SJean-Philippe Brucker 	.get_vq_count		= get_vq_count,
7241c47ce69SSasha Levin 	.init_vq		= init_vq,
72549bada43SJean-Philippe Brucker 	.exit_vq		= exit_vq,
72653fbb17bSJean-Philippe Brucker 	.get_vq			= get_vq,
7271c47ce69SSasha Levin 	.get_size_vq		= get_size_vq,
7280f4f51a8SAsias He 	.set_size_vq		= set_size_vq,
7290f4f51a8SAsias He 	.notify_vq		= notify_vq,
7309ed67cdcSSasha Levin 	.notify_vq_gsi		= notify_vq_gsi,
7319ed67cdcSSasha Levin 	.notify_vq_eventfd	= notify_vq_eventfd,
73295242e44SJean-Philippe Brucker 	.notify_status		= notify_status,
7331c47ce69SSasha Levin };
7341c47ce69SSasha Levin 
virtio_net__vhost_init(struct kvm * kvm,struct net_dev * ndev)7359ed67cdcSSasha Levin static void virtio_net__vhost_init(struct kvm *kvm, struct net_dev *ndev)
7369ed67cdcSSasha Levin {
7373a70ab1eSJean-Philippe Brucker 	if (ndev->queue_pairs > 1) {
7383a70ab1eSJean-Philippe Brucker 		pr_warning("multiqueue is not supported with vhost yet");
7393a70ab1eSJean-Philippe Brucker 		return;
7403a70ab1eSJean-Philippe Brucker 	}
7413a70ab1eSJean-Philippe Brucker 
7429ed67cdcSSasha Levin 	ndev->vhost_fd = open("/dev/vhost-net", O_RDWR);
7439ed67cdcSSasha Levin 	if (ndev->vhost_fd < 0)
7449ed67cdcSSasha Levin 		die_perror("Failed openning vhost-net device");
7459ed67cdcSSasha Levin 
746f84ab9ebSJean-Philippe Brucker 	virtio_vhost_init(kvm, ndev->vhost_fd);
747627d6874SAsias He 
748627d6874SAsias He 	ndev->vdev.use_vhost = true;
7499ed67cdcSSasha Levin }
7509ed67cdcSSasha Levin 
/*
 * Parse a colon-separated hexadecimal MAC address ("aa:bb:cc:dd:ee:ff")
 * from @str into the six bytes at @mac.
 *
 * The sscanf() result is not checked: on malformed input only the bytes
 * converted before the mismatch are written, the rest of @mac is left as is.
 */
static inline void str_to_mac(const char *str, char *mac)
{
	sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
	       &mac[0], &mac[1], &mac[2], &mac[3], &mac[4], &mac[5]);
}
set_net_param(struct kvm * kvm,struct virtio_net_params * p,const char * param,const char * val)7564346fd8fSSasha Levin static int set_net_param(struct kvm *kvm, struct virtio_net_params *p,
7574346fd8fSSasha Levin 			const char *param, const char *val)
7585f225124SSasha Levin {
7595f225124SSasha Levin 	if (strcmp(param, "guest_mac") == 0) {
7605f225124SSasha Levin 		str_to_mac(val, p->guest_mac);
7615f225124SSasha Levin 	} else if (strcmp(param, "mode") == 0) {
7625f225124SSasha Levin 		if (!strncmp(val, "user", 4)) {
7635f225124SSasha Levin 			int i;
7645f225124SSasha Levin 
7655f225124SSasha Levin 			for (i = 0; i < kvm->cfg.num_net_devices; i++)
7665f225124SSasha Levin 				if (kvm->cfg.net_params[i].mode == NET_MODE_USER)
7675f225124SSasha Levin 					die("Only one usermode network device allowed at a time");
7685f225124SSasha Levin 			p->mode = NET_MODE_USER;
7695f225124SSasha Levin 		} else if (!strncmp(val, "tap", 3)) {
7705f225124SSasha Levin 			p->mode = NET_MODE_TAP;
7715f225124SSasha Levin 		} else if (!strncmp(val, "none", 4)) {
7725f225124SSasha Levin 			kvm->cfg.no_net = 1;
7735f225124SSasha Levin 			return -1;
7745f225124SSasha Levin 		} else
7755f225124SSasha Levin 			die("Unknown network mode %s, please use user, tap or none", kvm->cfg.network);
7765f225124SSasha Levin 	} else if (strcmp(param, "script") == 0) {
7775f225124SSasha Levin 		p->script = strdup(val);
778eef27ae3SFan Du 	} else if (strcmp(param, "downscript") == 0) {
779eef27ae3SFan Du 		p->downscript = strdup(val);
7805f225124SSasha Levin 	} else if (strcmp(param, "guest_ip") == 0) {
7815f225124SSasha Levin 		p->guest_ip = strdup(val);
7825f225124SSasha Levin 	} else if (strcmp(param, "host_ip") == 0) {
7835f225124SSasha Levin 		p->host_ip = strdup(val);
7845f225124SSasha Levin 	} else if (strcmp(param, "trans") == 0) {
7855f225124SSasha Levin 		p->trans = strdup(val);
7861dfc7c24SMarc Zyngier 	} else if (strcmp(param, "tapif") == 0) {
7871dfc7c24SMarc Zyngier 		p->tapif = strdup(val);
7885f225124SSasha Levin 	} else if (strcmp(param, "vhost") == 0) {
7895f225124SSasha Levin 		p->vhost = atoi(val);
7905f225124SSasha Levin 	} else if (strcmp(param, "fd") == 0) {
7915f225124SSasha Levin 		p->fd = atoi(val);
79279052597SSasha Levin 	} else if (strcmp(param, "mq") == 0) {
79379052597SSasha Levin 		p->mq = atoi(val);
7945f225124SSasha Levin 	} else
7955f225124SSasha Levin 		die("Unknown network parameter %s", param);
7965f225124SSasha Levin 
7975f225124SSasha Levin 	return 0;
7985f225124SSasha Levin }
7995f225124SSasha Levin 
netdev_parser(const struct option * opt,const char * arg,int unset)8005f225124SSasha Levin int netdev_parser(const struct option *opt, const char *arg, int unset)
8015f225124SSasha Levin {
8025f225124SSasha Levin 	struct virtio_net_params p;
8035f225124SSasha Levin 	char *buf = NULL, *cmd = NULL, *cur = NULL;
8045f225124SSasha Levin 	bool on_cmd = true;
8055f225124SSasha Levin 	struct kvm *kvm = opt->ptr;
8065f225124SSasha Levin 
8075f225124SSasha Levin 	if (arg) {
8085f225124SSasha Levin 		buf = strdup(arg);
8095f225124SSasha Levin 		if (buf == NULL)
8105f225124SSasha Levin 			die("Failed allocating new net buffer");
8115f225124SSasha Levin 		cur = strtok(buf, ",=");
8125f225124SSasha Levin 	}
8135f225124SSasha Levin 
8145f225124SSasha Levin 	p = (struct virtio_net_params) {
8155f225124SSasha Levin 		.guest_ip	= DEFAULT_GUEST_ADDR,
8165f225124SSasha Levin 		.host_ip	= DEFAULT_HOST_ADDR,
8175f225124SSasha Levin 		.script		= DEFAULT_SCRIPT,
818eef27ae3SFan Du 		.downscript	= DEFAULT_SCRIPT,
8195f225124SSasha Levin 		.mode		= NET_MODE_TAP,
8205f225124SSasha Levin 	};
8215f225124SSasha Levin 
8225f225124SSasha Levin 	str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac);
8235f225124SSasha Levin 	p.guest_mac[5] += kvm->cfg.num_net_devices;
8245f225124SSasha Levin 
8255f225124SSasha Levin 	while (cur) {
8265f225124SSasha Levin 		if (on_cmd) {
8275f225124SSasha Levin 			cmd = cur;
8285f225124SSasha Levin 		} else {
8294346fd8fSSasha Levin 			if (set_net_param(kvm, &p, cmd, cur) < 0)
8305f225124SSasha Levin 				goto done;
8315f225124SSasha Levin 		}
8325f225124SSasha Levin 		on_cmd = !on_cmd;
8335f225124SSasha Levin 
8345f225124SSasha Levin 		cur = strtok(NULL, ",=");
8355f225124SSasha Levin 	};
8365f225124SSasha Levin 
8375f225124SSasha Levin 	kvm->cfg.num_net_devices++;
8385f225124SSasha Levin 
8395f225124SSasha Levin 	kvm->cfg.net_params = realloc(kvm->cfg.net_params, kvm->cfg.num_net_devices * sizeof(*kvm->cfg.net_params));
8405f225124SSasha Levin 	if (kvm->cfg.net_params == NULL)
8415f225124SSasha Levin 		die("Failed adding new network device");
8425f225124SSasha Levin 
8435f225124SSasha Levin 	kvm->cfg.net_params[kvm->cfg.num_net_devices - 1] = p;
8445f225124SSasha Levin 
8455f225124SSasha Levin done:
8465f225124SSasha Levin 	free(buf);
8475f225124SSasha Levin 	return 0;
8485f225124SSasha Levin }
8495f225124SSasha Levin 
virtio_net__init_one(struct virtio_net_params * params)8504498eb74SAlexandru Elisei static int virtio_net__init_one(struct virtio_net_params *params)
8514f56d42cSAsias He {
8529b46ebc5SRajnesh Kanwal 	enum virtio_trans trans = params->kvm->cfg.virtio_transport;
8539a6d73f1SSasha Levin 	struct net_dev *ndev;
85476a4aac6SWill Deacon 	struct virtio_ops *ops;
8559b46ebc5SRajnesh Kanwal 	int i, r;
8569a6d73f1SSasha Levin 
8579a6d73f1SSasha Levin 	ndev = calloc(1, sizeof(struct net_dev));
8589a6d73f1SSasha Levin 	if (ndev == NULL)
8595f225124SSasha Levin 		return -ENOMEM;
8609a6d73f1SSasha Levin 
8619a6d73f1SSasha Levin 	list_add_tail(&ndev->list, &ndevs);
8629a6d73f1SSasha Levin 
863db927775SAlexandru Elisei 	ops = malloc(sizeof(*ops));
864db927775SAlexandru Elisei 	if (ops == NULL)
865db927775SAlexandru Elisei 		return -ENOMEM;
866db927775SAlexandru Elisei 
8679a6d73f1SSasha Levin 	ndev->kvm = params->kvm;
8688c0ae74dSSasha Levin 	ndev->params = params;
8699a6d73f1SSasha Levin 
8709a6d73f1SSasha Levin 	mutex_init(&ndev->mutex);
87179052597SSasha Levin 	ndev->queue_pairs = max(1, min(VIRTIO_NET_NUM_QUEUES, params->mq));
87279052597SSasha Levin 
8730c54698eSAsias He 	for (i = 0 ; i < 6 ; i++) {
8749a6d73f1SSasha Levin 		ndev->config.mac[i]		= params->guest_mac[i];
8759a6d73f1SSasha Levin 		ndev->info.guest_mac.addr[i]	= params->guest_mac[i];
8769a6d73f1SSasha Levin 		ndev->info.host_mac.addr[i]	= params->host_mac[i];
8770c54698eSAsias He 	}
878f715177dSAsias He 
8799a6d73f1SSasha Levin 	ndev->mode = params->mode;
8809a6d73f1SSasha Levin 	if (ndev->mode == NET_MODE_TAP) {
8819a6d73f1SSasha Levin 		ndev->ops = &tap_ops;
88259ee54ebSWei Chen 		if (!virtio_net__tap_create(ndev))
88359ee54ebSWei Chen 			die_perror("You have requested a TAP device, but creation of one has failed because");
884b4fdde6dSAsias He 	} else {
8859a6d73f1SSasha Levin 		ndev->info.host_ip		= ntohl(inet_addr(params->host_ip));
8869a6d73f1SSasha Levin 		ndev->info.guest_ip		= ntohl(inet_addr(params->guest_ip));
8879a6d73f1SSasha Levin 		ndev->info.guest_netmask	= ntohl(inet_addr("255.255.255.0"));
8889a6d73f1SSasha Levin 		ndev->info.buf_nr		= 20,
8899a6d73f1SSasha Levin 		ndev->ops = &uip_ops;
8905f3aaf22SMarc Zyngier 		uip_static_init(&ndev->info);
891b4fdde6dSAsias He 	}
892b5ee1ea7SAsias He 
89376a4aac6SWill Deacon 	*ops = net_dev_virtio_ops;
894dc7a55d6SSuzuki K. Poulose 
895dc7a55d6SSuzuki K. Poulose 	if (params->trans) {
896dc7a55d6SSuzuki K. Poulose 		if (strcmp(params->trans, "mmio") == 0)
897dc7a55d6SSuzuki K. Poulose 			trans = VIRTIO_MMIO;
898dc7a55d6SSuzuki K. Poulose 		else if (strcmp(params->trans, "pci") == 0)
899dc7a55d6SSuzuki K. Poulose 			trans = VIRTIO_PCI;
90069205aa1SAsias He 		else
901dc7a55d6SSuzuki K. Poulose 			pr_warning("virtio-net: Unknown transport method : %s, "
902dc7a55d6SSuzuki K. Poulose 				   "falling back to %s.", params->trans,
903dc7a55d6SSuzuki K. Poulose 				   virtio_trans_name(trans));
904dc7a55d6SSuzuki K. Poulose 	}
905dc7a55d6SSuzuki K. Poulose 
906db927775SAlexandru Elisei 	r = virtio_init(params->kvm, ndev, &ndev->vdev, ops, trans,
90776a4aac6SWill Deacon 			PCI_DEVICE_ID_VIRTIO_NET, VIRTIO_ID_NET, PCI_CLASS_NET);
908db927775SAlexandru Elisei 	if (r < 0) {
909db927775SAlexandru Elisei 		free(ops);
910db927775SAlexandru Elisei 		return r;
911db927775SAlexandru Elisei 	}
91227ab67f5SSasha Levin 
9139ed67cdcSSasha Levin 	if (params->vhost)
9149ed67cdcSSasha Levin 		virtio_net__vhost_init(params->kvm, ndev);
915cb83de6fSSasha Levin 
9164498eb74SAlexandru Elisei 	if (compat_id == -1)
91752f34d2cSAsias He 		compat_id = virtio_compat_add_message("virtio-net", "CONFIG_VIRTIO_NET");
9185f225124SSasha Levin 
9195f225124SSasha Levin 	return 0;
9205f225124SSasha Levin }
9215f225124SSasha Levin 
virtio_net__init(struct kvm * kvm)9225f225124SSasha Levin int virtio_net__init(struct kvm *kvm)
9235f225124SSasha Levin {
924db927775SAlexandru Elisei 	int i, r;
9255f225124SSasha Levin 
9265f225124SSasha Levin 	for (i = 0; i < kvm->cfg.num_net_devices; i++) {
9275f225124SSasha Levin 		kvm->cfg.net_params[i].kvm = kvm;
9284498eb74SAlexandru Elisei 		r = virtio_net__init_one(&kvm->cfg.net_params[i]);
929db927775SAlexandru Elisei 		if (r < 0)
930db927775SAlexandru Elisei 			goto cleanup;
9315f225124SSasha Levin 	}
9325f225124SSasha Levin 
9335f225124SSasha Levin 	if (kvm->cfg.num_net_devices == 0 && kvm->cfg.no_net == 0) {
9348c0ae74dSSasha Levin 		static struct virtio_net_params net_params;
9355f225124SSasha Levin 
9365f225124SSasha Levin 		net_params = (struct virtio_net_params) {
9375f225124SSasha Levin 			.guest_ip	= kvm->cfg.guest_ip,
9385f225124SSasha Levin 			.host_ip	= kvm->cfg.host_ip,
9395f225124SSasha Levin 			.kvm		= kvm,
9405f225124SSasha Levin 			.script		= kvm->cfg.script,
9415f225124SSasha Levin 			.mode		= NET_MODE_USER,
9425f225124SSasha Levin 		};
9435f225124SSasha Levin 		str_to_mac(kvm->cfg.guest_mac, net_params.guest_mac);
9445f225124SSasha Levin 		str_to_mac(kvm->cfg.host_mac, net_params.host_mac);
9455f225124SSasha Levin 
9464498eb74SAlexandru Elisei 		r = virtio_net__init_one(&net_params);
947db927775SAlexandru Elisei 		if (r < 0)
948db927775SAlexandru Elisei 			goto cleanup;
9495f225124SSasha Levin 	}
9505f225124SSasha Levin 
9515f225124SSasha Levin 	return 0;
952db927775SAlexandru Elisei 
953db927775SAlexandru Elisei cleanup:
954db927775SAlexandru Elisei 	virtio_net__exit(kvm);
955db927775SAlexandru Elisei 	return r;
9565f225124SSasha Levin }
95749a8afd1SSasha Levin virtio_dev_init(virtio_net__init);
9585f225124SSasha Levin 
virtio_net__exit(struct kvm * kvm)9595f225124SSasha Levin int virtio_net__exit(struct kvm *kvm)
9605f225124SSasha Levin {
961eef27ae3SFan Du 	struct virtio_net_params *params;
962eef27ae3SFan Du 	struct net_dev *ndev;
963db927775SAlexandru Elisei 	struct list_head *ptr, *n;
964eef27ae3SFan Du 
965db927775SAlexandru Elisei 	list_for_each_safe(ptr, n, &ndevs) {
966eef27ae3SFan Du 		ndev = list_entry(ptr, struct net_dev, list);
967eef27ae3SFan Du 		params = ndev->params;
968eef27ae3SFan Du 		/* Cleanup any tap device which attached to bridge */
969eef27ae3SFan Du 		if (ndev->mode == NET_MODE_TAP &&
970eef27ae3SFan Du 		    strcmp(params->downscript, "none"))
971eef27ae3SFan Du 			virtio_net_exec_script(params->downscript, ndev->tap_name);
972*74af1456SEduardo Bart 		virtio_net_stop(ndev);
973db927775SAlexandru Elisei 
974db927775SAlexandru Elisei 		list_del(&ndev->list);
975*74af1456SEduardo Bart 		virtio_exit(kvm, &ndev->vdev);
976db927775SAlexandru Elisei 		free(ndev);
977eef27ae3SFan Du 	}
978*74af1456SEduardo Bart 
9795f225124SSasha Levin 	return 0;
9804f56d42cSAsias He }
98149a8afd1SSasha Levin virtio_dev_exit(virtio_net__exit);
982