#include "kvm/virtio-pci-dev.h"
#include "kvm/virtio-net.h"
#include "kvm/virtio.h"
#include "kvm/mutex.h"
#include "kvm/util.h"
#include "kvm/kvm.h"
#include "kvm/uip.h"
#include "kvm/guest_compat.h"
#include "kvm/iovec.h"
#include "kvm/strbuf.h"

#include <linux/list.h>
#include <linux/vhost.h>
#include <linux/virtio_net.h>
#include <linux/if_tun.h>
#include <linux/types.h>

#include <arpa/inet.h>
#include <net/if.h>

#include <errno.h>
#include <unistd.h>
#include <fcntl.h>

#include <sys/socket.h>
#include <sys/ioctl.h>
#include <sys/types.h>
#include <sys/wait.h>
284f56d42cSAsias He
/* Ring size handed to virtio_init_device_vq(); also bounds the per-thread iovec arrays. */
#define VIRTIO_NET_QUEUE_SIZE		256
/* Sizes net_dev.queues[]: two virtqueues per unit, plus one control queue. */
#define VIRTIO_NET_NUM_QUEUES		8
314f56d42cSAsias He
32b4fdde6dSAsias He struct net_dev;
33b4fdde6dSAsias He
34b4fdde6dSAsias He struct net_dev_operations {
35b4fdde6dSAsias He int (*rx)(struct iovec *iov, u16 in, struct net_dev *ndev);
36b4fdde6dSAsias He int (*tx)(struct iovec *iov, u16 in, struct net_dev *ndev);
37b4fdde6dSAsias He };
38b4fdde6dSAsias He
39ad96e867SJean-Philippe Brucker struct net_dev_queue {
40ad96e867SJean-Philippe Brucker int id;
41ad96e867SJean-Philippe Brucker struct net_dev *ndev;
42ad96e867SJean-Philippe Brucker struct virt_queue vq;
43ad96e867SJean-Philippe Brucker pthread_t thread;
44ad96e867SJean-Philippe Brucker struct mutex lock;
45ad96e867SJean-Philippe Brucker pthread_cond_t cond;
46ad96e867SJean-Philippe Brucker };
47ad96e867SJean-Philippe Brucker
488626798bSAsias He struct net_dev {
49d3476f7dSSasha Levin struct mutex mutex;
5002eca50cSAsias He struct virtio_device vdev;
519a6d73f1SSasha Levin struct list_head list;
524f56d42cSAsias He
53ad96e867SJean-Philippe Brucker struct net_dev_queue queues[VIRTIO_NET_NUM_QUEUES * 2 + 1];
54c229370aSIngo Molnar struct virtio_net_config config;
55902a8ecbSJean-Philippe Brucker u32 queue_pairs;
56c4aa7c02SPekka Enberg
579ed67cdcSSasha Levin int vhost_fd;
584f56d42cSAsias He int tap_fd;
594f56d42cSAsias He char tap_name[IFNAMSIZ];
6059ee54ebSWei Chen bool tap_ufo;
61bb1a32f1SAsias He
62bb1a32f1SAsias He int mode;
63bb1a32f1SAsias He
64b5ee1ea7SAsias He struct uip_info info;
65b4fdde6dSAsias He struct net_dev_operations *ops;
669a6d73f1SSasha Levin struct kvm *kvm;
678c0ae74dSSasha Levin
688c0ae74dSSasha Levin struct virtio_net_params *params;
694f56d42cSAsias He };
704f56d42cSAsias He
/* File-scope list head for net devices. */
static LIST_HEAD(ndevs);
/* Id passed to compat__remove_message() once the guest sets up a queue. */
static int compat_id = -1;

/* Payload capacity of the RX bounce buffer; the virtio-net header is added on top. */
#define MAX_PACKET_SIZE 65550
757668c3a6SSasha Levin
/*
 * Tell whether feature bit @feature is set in the device's feature word.
 *
 * The mask is built as a 64-bit value: shifting a plain int by 31 or more
 * is undefined, and the feature word is handled as u64 elsewhere in this
 * file.
 */
static bool has_virtio_feature(struct net_dev *ndev, u32 feature)
{
	return (ndev->vdev.features & (1ULL << feature)) != 0;
}
807668c3a6SSasha Levin
virtio_net_hdr_len(struct net_dev * ndev)81b231683cSJean-Philippe Brucker static int virtio_net_hdr_len(struct net_dev *ndev)
82b231683cSJean-Philippe Brucker {
83b231683cSJean-Philippe Brucker if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ||
84b231683cSJean-Philippe Brucker !ndev->vdev.legacy)
85b231683cSJean-Philippe Brucker return sizeof(struct virtio_net_hdr_mrg_rxbuf);
86b231683cSJean-Philippe Brucker
87b231683cSJean-Philippe Brucker return sizeof(struct virtio_net_hdr);
88b231683cSJean-Philippe Brucker }
89b231683cSJean-Philippe Brucker
virtio_net_rx_thread(void * p)90c4aa7c02SPekka Enberg static void *virtio_net_rx_thread(void *p)
914f56d42cSAsias He {
924f56d42cSAsias He struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
93ad96e867SJean-Philippe Brucker struct net_dev_queue *queue = p;
94ad96e867SJean-Philippe Brucker struct virt_queue *vq = &queue->vq;
95ad96e867SJean-Philippe Brucker struct net_dev *ndev = queue->ndev;
9643835ac9SSasha Levin struct kvm *kvm;
973fdf659dSSasha Levin u16 out, in;
983fdf659dSSasha Levin u16 head;
996d6cc14bSWill Deacon int len, copied;
1004f56d42cSAsias He
101a4d8c55eSSasha Levin kvm__set_thread_name("virtio-net-rx");
102a4d8c55eSSasha Levin
1039a6d73f1SSasha Levin kvm = ndev->kvm;
104c4aa7c02SPekka Enberg while (1) {
105ad96e867SJean-Philippe Brucker mutex_lock(&queue->lock);
106c4aa7c02SPekka Enberg if (!virt_queue__available(vq))
107ad96e867SJean-Philippe Brucker pthread_cond_wait(&queue->cond, &queue->lock.mutex);
108ad96e867SJean-Philippe Brucker mutex_unlock(&queue->lock);
1094f56d42cSAsias He
1104f56d42cSAsias He while (virt_queue__available(vq)) {
1117668c3a6SSasha Levin unsigned char buffer[MAX_PACKET_SIZE + sizeof(struct virtio_net_hdr_mrg_rxbuf)];
1127668c3a6SSasha Levin struct iovec dummy_iov = {
1137668c3a6SSasha Levin .iov_base = buffer,
1147668c3a6SSasha Levin .iov_len = sizeof(buffer),
1157668c3a6SSasha Levin };
1167668c3a6SSasha Levin struct virtio_net_hdr_mrg_rxbuf *hdr;
1173fea89a9SWill Deacon u16 num_buffers;
1187f5ffaf5SAsias He
1197668c3a6SSasha Levin len = ndev->ops->rx(&dummy_iov, 1, ndev);
1206d6cc14bSWill Deacon if (len < 0) {
1216d6cc14bSWill Deacon pr_warning("%s: rx on vq %u failed (%d), exiting thread\n",
122ad96e867SJean-Philippe Brucker __func__, queue->id, len);
1236d6cc14bSWill Deacon goto out_err;
1246d6cc14bSWill Deacon }
1256d6cc14bSWill Deacon
1263fea89a9SWill Deacon copied = num_buffers = 0;
1277668c3a6SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1288ed60bbeSMarc Zyngier hdr = iov[0].iov_base;
1297668c3a6SSasha Levin while (copied < len) {
1306d6cc14bSWill Deacon size_t iovsize = min_t(size_t, len - copied, iov_size(iov, in));
1317668c3a6SSasha Levin
132e2493047SAsias He memcpy_toiovec(iov, buffer + copied, iovsize);
1337668c3a6SSasha Levin copied += iovsize;
1343fea89a9SWill Deacon virt_queue__set_used_elem_no_update(vq, head, iovsize, num_buffers++);
1357668c3a6SSasha Levin if (copied == len)
1367668c3a6SSasha Levin break;
1377668c3a6SSasha Levin while (!virt_queue__available(vq))
1387668c3a6SSasha Levin sleep(0);
1397668c3a6SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1407668c3a6SSasha Levin }
1413fea89a9SWill Deacon
142b231683cSJean-Philippe Brucker /*
143b231683cSJean-Philippe Brucker * The device MUST set num_buffers, except in the case
144b231683cSJean-Philippe Brucker * where the legacy driver did not negotiate
145b231683cSJean-Philippe Brucker * VIRTIO_NET_F_MRG_RXBUF and the field does not exist.
146b231683cSJean-Philippe Brucker */
147b231683cSJean-Philippe Brucker if (has_virtio_feature(ndev, VIRTIO_NET_F_MRG_RXBUF) ||
148b231683cSJean-Philippe Brucker !ndev->vdev.legacy)
149b17552eeSAndre Przywara hdr->num_buffers = virtio_host_to_guest_u16(vq->endian, num_buffers);
1503fea89a9SWill Deacon
1513fea89a9SWill Deacon virt_queue__used_idx_advance(vq, num_buffers);
1523fea89a9SWill Deacon
153c4aa7c02SPekka Enberg /* We should interrupt guest right now, otherwise latency is huge. */
1546585ffb7SSasha Levin if (virtio_queue__should_signal(vq))
155ad96e867SJean-Philippe Brucker ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id);
1564f56d42cSAsias He }
157c4aa7c02SPekka Enberg }
158c4aa7c02SPekka Enberg
1596d6cc14bSWill Deacon out_err:
160c4aa7c02SPekka Enberg pthread_exit(NULL);
161c4aa7c02SPekka Enberg return NULL;
162c4aa7c02SPekka Enberg
163c4aa7c02SPekka Enberg }
164c4aa7c02SPekka Enberg
virtio_net_tx_thread(void * p)165c4aa7c02SPekka Enberg static void *virtio_net_tx_thread(void *p)
1664f56d42cSAsias He {
1674f56d42cSAsias He struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
168ad96e867SJean-Philippe Brucker struct net_dev_queue *queue = p;
169ad96e867SJean-Philippe Brucker struct virt_queue *vq = &queue->vq;
170ad96e867SJean-Philippe Brucker struct net_dev *ndev = queue->ndev;
17143835ac9SSasha Levin struct kvm *kvm;
1723fdf659dSSasha Levin u16 out, in;
1733fdf659dSSasha Levin u16 head;
1744f56d42cSAsias He int len;
1754f56d42cSAsias He
176a4d8c55eSSasha Levin kvm__set_thread_name("virtio-net-tx");
177a4d8c55eSSasha Levin
1789a6d73f1SSasha Levin kvm = ndev->kvm;
179c4aa7c02SPekka Enberg
180c4aa7c02SPekka Enberg while (1) {
181ad96e867SJean-Philippe Brucker mutex_lock(&queue->lock);
182c4aa7c02SPekka Enberg if (!virt_queue__available(vq))
183ad96e867SJean-Philippe Brucker pthread_cond_wait(&queue->cond, &queue->lock.mutex);
184ad96e867SJean-Philippe Brucker mutex_unlock(&queue->lock);
1854f56d42cSAsias He
1864f56d42cSAsias He while (virt_queue__available(vq)) {
18743835ac9SSasha Levin head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
1889a6d73f1SSasha Levin len = ndev->ops->tx(iov, out, ndev);
1896d6cc14bSWill Deacon if (len < 0) {
1906d6cc14bSWill Deacon pr_warning("%s: tx on vq %u failed (%d)\n",
191ad96e867SJean-Philippe Brucker __func__, queue->id, errno);
1926d6cc14bSWill Deacon goto out_err;
1936d6cc14bSWill Deacon }
1946d6cc14bSWill Deacon
1954f56d42cSAsias He virt_queue__set_used_elem(vq, head, len);
1964f56d42cSAsias He }
1974f56d42cSAsias He
1986585ffb7SSasha Levin if (virtio_queue__should_signal(vq))
199ad96e867SJean-Philippe Brucker ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id);
2004f56d42cSAsias He }
2014f56d42cSAsias He
2026d6cc14bSWill Deacon out_err:
203c4aa7c02SPekka Enberg pthread_exit(NULL);
204c4aa7c02SPekka Enberg return NULL;
205c4aa7c02SPekka Enberg }
206407475bfSPekka Enberg
virtio_net_handle_mq(struct kvm * kvm,struct net_dev * ndev,struct virtio_net_ctrl_hdr * ctrl)2076585ffb7SSasha Levin static virtio_net_ctrl_ack virtio_net_handle_mq(struct kvm* kvm, struct net_dev *ndev, struct virtio_net_ctrl_hdr *ctrl)
2086585ffb7SSasha Levin {
2096585ffb7SSasha Levin /* Not much to do here */
2106585ffb7SSasha Levin return VIRTIO_NET_OK;
2116585ffb7SSasha Levin }
2126585ffb7SSasha Levin
virtio_net_ctrl_thread(void * p)2136585ffb7SSasha Levin static void *virtio_net_ctrl_thread(void *p)
214abd4a801SSasha Levin {
215abd4a801SSasha Levin struct iovec iov[VIRTIO_NET_QUEUE_SIZE];
216ad96e867SJean-Philippe Brucker struct net_dev_queue *queue = p;
217ad96e867SJean-Philippe Brucker struct virt_queue *vq = &queue->vq;
218ad96e867SJean-Philippe Brucker struct net_dev *ndev = queue->ndev;
219abd4a801SSasha Levin u16 out, in, head;
2206585ffb7SSasha Levin struct kvm *kvm = ndev->kvm;
2216daffe57SJean-Philippe Brucker struct virtio_net_ctrl_hdr ctrl;
2226daffe57SJean-Philippe Brucker virtio_net_ctrl_ack ack;
2236daffe57SJean-Philippe Brucker size_t len;
224abd4a801SSasha Levin
225edb4a8a0SSuzuki K. Poulose kvm__set_thread_name("virtio-net-ctrl");
226edb4a8a0SSuzuki K. Poulose
2276585ffb7SSasha Levin while (1) {
228ad96e867SJean-Philippe Brucker mutex_lock(&queue->lock);
2296585ffb7SSasha Levin if (!virt_queue__available(vq))
230ad96e867SJean-Philippe Brucker pthread_cond_wait(&queue->cond, &queue->lock.mutex);
231ad96e867SJean-Philippe Brucker mutex_unlock(&queue->lock);
2326585ffb7SSasha Levin
2336585ffb7SSasha Levin while (virt_queue__available(vq)) {
234ad96e867SJean-Philippe Brucker head = virt_queue__get_iov(vq, iov, &out, &in, kvm);
2356daffe57SJean-Philippe Brucker len = min(iov_size(iov, in), sizeof(ctrl));
2366daffe57SJean-Philippe Brucker memcpy_fromiovec((void *)&ctrl, iov, len);
237abd4a801SSasha Levin
2386daffe57SJean-Philippe Brucker switch (ctrl.class) {
2396585ffb7SSasha Levin case VIRTIO_NET_CTRL_MQ:
2406daffe57SJean-Philippe Brucker ack = virtio_net_handle_mq(kvm, ndev, &ctrl);
2416585ffb7SSasha Levin break;
242abd4a801SSasha Levin default:
2436daffe57SJean-Philippe Brucker ack = VIRTIO_NET_ERR;
244abd4a801SSasha Levin break;
245abd4a801SSasha Levin }
2466daffe57SJean-Philippe Brucker memcpy_toiovec(iov + in, &ack, sizeof(ack));
2476daffe57SJean-Philippe Brucker virt_queue__set_used_elem(vq, head, sizeof(ack));
2486585ffb7SSasha Levin }
249abd4a801SSasha Levin
250ad96e867SJean-Philippe Brucker if (virtio_queue__should_signal(vq))
251ad96e867SJean-Philippe Brucker ndev->vdev.ops->signal_vq(kvm, &ndev->vdev, queue->id);
2526585ffb7SSasha Levin }
253abd4a801SSasha Levin
2546585ffb7SSasha Levin pthread_exit(NULL);
255abd4a801SSasha Levin
2566585ffb7SSasha Levin return NULL;
257abd4a801SSasha Levin }
258abd4a801SSasha Levin
virtio_net_handle_callback(struct kvm * kvm,struct net_dev * ndev,int queue)2599a6d73f1SSasha Levin static void virtio_net_handle_callback(struct kvm *kvm, struct net_dev *ndev, int queue)
2604f56d42cSAsias He {
261ad96e867SJean-Philippe Brucker struct net_dev_queue *net_queue = &ndev->queues[queue];
262ad96e867SJean-Philippe Brucker
26379052597SSasha Levin if ((u32)queue >= (ndev->queue_pairs * 2 + 1)) {
2649a6d73f1SSasha Levin pr_warning("Unknown queue index %u", queue);
2656585ffb7SSasha Levin return;
266c4aa7c02SPekka Enberg }
2676585ffb7SSasha Levin
268ad96e867SJean-Philippe Brucker mutex_lock(&net_queue->lock);
269ad96e867SJean-Philippe Brucker pthread_cond_signal(&net_queue->cond);
270ad96e867SJean-Philippe Brucker mutex_unlock(&net_queue->lock);
2714f56d42cSAsias He }
2724f56d42cSAsias He
virtio_net_request_tap(struct net_dev * ndev,struct ifreq * ifr,const char * tapname)273d2a7ddffSMarc Zyngier static int virtio_net_request_tap(struct net_dev *ndev, struct ifreq *ifr,
274d2a7ddffSMarc Zyngier const char *tapname)
275d2a7ddffSMarc Zyngier {
276d2a7ddffSMarc Zyngier int ret;
277d2a7ddffSMarc Zyngier
278d2a7ddffSMarc Zyngier memset(ifr, 0, sizeof(*ifr));
279d2a7ddffSMarc Zyngier ifr->ifr_flags = IFF_TAP | IFF_NO_PI | IFF_VNET_HDR;
280d2a7ddffSMarc Zyngier if (tapname)
28105755b29SAndre Przywara strlcpy(ifr->ifr_name, tapname, sizeof(ifr->ifr_name));
282d2a7ddffSMarc Zyngier
283f83dc816SAndreas Herrmann ret = ioctl(ndev->tap_fd, TUNSETIFF, ifr);
284d2a7ddffSMarc Zyngier
285d2a7ddffSMarc Zyngier if (ret >= 0)
28605755b29SAndre Przywara strlcpy(ndev->tap_name, ifr->ifr_name, sizeof(ndev->tap_name));
287d2a7ddffSMarc Zyngier return ret;
288d2a7ddffSMarc Zyngier }
289d2a7ddffSMarc Zyngier
/*
 * Run @script with @tap_name as its only argument and wait for it to finish.
 *
 * Returns 0 when the script exits with status 0, and -1 when the child
 * cannot be created, cannot be waited for, exits with a non-zero status or
 * is terminated abnormally.
 */
static int virtio_net_exec_script(const char* script, const char *tap_name)
{
	pid_t pid;
	int status;

	pid = vfork();
	if (pid < 0) {
		/* Without this check waitpid(-1, ...) would reap an unrelated child. */
		pr_warning("Fail to setup tap by %s", script);
		return -1;
	}

	if (pid == 0) {
		execl(script, script, tap_name, (char *)NULL);
		/* Only reached when exec failed. */
		_exit(1);
	}

	while (waitpid(pid, &status, 0) < 0) {
		if (errno == EINTR)
			continue;
		pr_warning("Fail to setup tap by %s", script);
		return -1;
	}

	if (!WIFEXITED(status) || WEXITSTATUS(status) != 0) {
		pr_warning("Fail to setup tap by %s", script);
		return -1;
	}

	return 0;
}
308eef27ae3SFan Du
virtio_net__tap_init(struct net_dev * ndev)3098c0ae74dSSasha Levin static bool virtio_net__tap_init(struct net_dev *ndev)
3104f56d42cSAsias He {
311cb7202c1SSasha Levin int sock = socket(AF_INET, SOCK_STREAM, 0);
31259ee54ebSWei Chen int hdr_len;
313cb7202c1SSasha Levin struct sockaddr_in sin = {0};
314246c8347SAsias He struct ifreq ifr;
3158c0ae74dSSasha Levin const struct virtio_net_params *params = ndev->params;
3161dfc7c24SMarc Zyngier bool skipconf = !!params->tapif;
3174f56d42cSAsias He
318b231683cSJean-Philippe Brucker hdr_len = virtio_net_hdr_len(ndev);
3199a6d73f1SSasha Levin if (ioctl(ndev->tap_fd, TUNSETVNETHDRSZ, &hdr_len) < 0)
3204542f276SCyrill Gorcunov pr_warning("Config tap device TUNSETVNETHDRSZ error");
321246c8347SAsias He
32273b7d038SAmos Kong if (strcmp(params->script, "none")) {
323eef27ae3SFan Du if (virtio_net_exec_script(params->script, ndev->tap_name) < 0)
32473b7d038SAmos Kong goto fail;
3251dfc7c24SMarc Zyngier } else if (!skipconf) {
326cb7202c1SSasha Levin memset(&ifr, 0, sizeof(ifr));
32716509081SAnisse Astier strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name));
328bdfcfca6SSasha Levin sin.sin_addr.s_addr = inet_addr(params->host_ip);
329cb7202c1SSasha Levin memcpy(&(ifr.ifr_addr), &sin, sizeof(ifr.ifr_addr));
330cb7202c1SSasha Levin ifr.ifr_addr.sa_family = AF_INET;
3313b02f580SSasha Levin if (ioctl(sock, SIOCSIFADDR, &ifr) < 0) {
3324542f276SCyrill Gorcunov pr_warning("Could not set ip address on tap device");
3333b02f580SSasha Levin goto fail;
3343b02f580SSasha Levin }
33573b7d038SAmos Kong }
336cb7202c1SSasha Levin
3371dfc7c24SMarc Zyngier if (!skipconf) {
338cb7202c1SSasha Levin memset(&ifr, 0, sizeof(ifr));
33916509081SAnisse Astier strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name));
340cb7202c1SSasha Levin ioctl(sock, SIOCGIFFLAGS, &ifr);
341cb7202c1SSasha Levin ifr.ifr_flags |= IFF_UP | IFF_RUNNING;
342cb7202c1SSasha Levin if (ioctl(sock, SIOCSIFFLAGS, &ifr) < 0)
3434542f276SCyrill Gorcunov pr_warning("Could not bring tap device up");
3441dfc7c24SMarc Zyngier }
345cb7202c1SSasha Levin
346cb7202c1SSasha Levin close(sock);
3473b02f580SSasha Levin
3483b02f580SSasha Levin return 1;
3493b02f580SSasha Levin
3503b02f580SSasha Levin fail:
3513b02f580SSasha Levin if (sock >= 0)
3523b02f580SSasha Levin close(sock);
3539a6d73f1SSasha Levin if (ndev->tap_fd >= 0)
3549a6d73f1SSasha Levin close(ndev->tap_fd);
3553b02f580SSasha Levin
3563b02f580SSasha Levin return 0;
3574f56d42cSAsias He }
3584f56d42cSAsias He
virtio_net__tap_exit(struct net_dev * ndev)35949bada43SJean-Philippe Brucker static void virtio_net__tap_exit(struct net_dev *ndev)
36049bada43SJean-Philippe Brucker {
36149bada43SJean-Philippe Brucker int sock;
36249bada43SJean-Philippe Brucker struct ifreq ifr;
36349bada43SJean-Philippe Brucker
36449bada43SJean-Philippe Brucker if (ndev->params->tapif)
36549bada43SJean-Philippe Brucker return;
36649bada43SJean-Philippe Brucker
36749bada43SJean-Philippe Brucker sock = socket(AF_INET, SOCK_STREAM, 0);
36816509081SAnisse Astier strncpy(ifr.ifr_name, ndev->tap_name, sizeof(ifr.ifr_name));
36949bada43SJean-Philippe Brucker ioctl(sock, SIOCGIFFLAGS, &ifr);
37049bada43SJean-Philippe Brucker ifr.ifr_flags &= ~(IFF_UP | IFF_RUNNING);
37149bada43SJean-Philippe Brucker if (ioctl(sock, SIOCGIFFLAGS, &ifr) < 0)
37249bada43SJean-Philippe Brucker pr_warning("Count not bring tap device down");
37349bada43SJean-Philippe Brucker close(sock);
37449bada43SJean-Philippe Brucker }
37549bada43SJean-Philippe Brucker
virtio_net__tap_create(struct net_dev * ndev)37659ee54ebSWei Chen static bool virtio_net__tap_create(struct net_dev *ndev)
37759ee54ebSWei Chen {
37859ee54ebSWei Chen int offload;
37959ee54ebSWei Chen struct ifreq ifr;
38059ee54ebSWei Chen const struct virtio_net_params *params = ndev->params;
38159ee54ebSWei Chen bool macvtap = (!!params->tapif) && (params->tapif[0] == '/');
38259ee54ebSWei Chen
38359ee54ebSWei Chen /* Did the user already gave us the FD? */
38459ee54ebSWei Chen if (params->fd)
38559ee54ebSWei Chen ndev->tap_fd = params->fd;
38659ee54ebSWei Chen else {
38759ee54ebSWei Chen const char *tap_file = "/dev/net/tun";
38859ee54ebSWei Chen
38959ee54ebSWei Chen /* Did the user ask us to use macvtap? */
39059ee54ebSWei Chen if (macvtap)
39159ee54ebSWei Chen tap_file = params->tapif;
39259ee54ebSWei Chen
39359ee54ebSWei Chen ndev->tap_fd = open(tap_file, O_RDWR);
39459ee54ebSWei Chen if (ndev->tap_fd < 0) {
39559ee54ebSWei Chen pr_warning("Unable to open %s", tap_file);
39659ee54ebSWei Chen return 0;
39759ee54ebSWei Chen }
39859ee54ebSWei Chen }
39959ee54ebSWei Chen
40059ee54ebSWei Chen if (!macvtap &&
40159ee54ebSWei Chen virtio_net_request_tap(ndev, &ifr, params->tapif) < 0) {
40259ee54ebSWei Chen pr_warning("Config tap device error. Are you root?");
40359ee54ebSWei Chen goto fail;
40459ee54ebSWei Chen }
40559ee54ebSWei Chen
40659ee54ebSWei Chen /*
40759ee54ebSWei Chen * The UFO support had been removed from kernel in commit:
40859ee54ebSWei Chen * ID: fb652fdfe83710da0ca13448a41b7ed027d0a984
40959ee54ebSWei Chen * https://www.spinics.net/lists/netdev/msg443562.html
41059ee54ebSWei Chen * In oder to support the older kernels without this commit,
41159ee54ebSWei Chen * we set the TUN_F_UFO to offload by default to test the status of
41259ee54ebSWei Chen * UFO kernel support.
41359ee54ebSWei Chen */
41459ee54ebSWei Chen ndev->tap_ufo = true;
41559ee54ebSWei Chen offload = TUN_F_CSUM | TUN_F_TSO4 | TUN_F_TSO6 | TUN_F_UFO;
41659ee54ebSWei Chen if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) {
41759ee54ebSWei Chen /*
41859ee54ebSWei Chen * Is this failure caused by kernel remove the UFO support?
41959ee54ebSWei Chen * Try TUNSETOFFLOAD without TUN_F_UFO.
42059ee54ebSWei Chen */
42159ee54ebSWei Chen offload &= ~TUN_F_UFO;
42259ee54ebSWei Chen if (ioctl(ndev->tap_fd, TUNSETOFFLOAD, offload) < 0) {
42359ee54ebSWei Chen pr_warning("Config tap device TUNSETOFFLOAD error");
42459ee54ebSWei Chen goto fail;
42559ee54ebSWei Chen }
42659ee54ebSWei Chen ndev->tap_ufo = false;
42759ee54ebSWei Chen }
42859ee54ebSWei Chen
42959ee54ebSWei Chen return 1;
43059ee54ebSWei Chen
43159ee54ebSWei Chen fail:
43259ee54ebSWei Chen if ((ndev->tap_fd >= 0) || (!params->fd) )
43359ee54ebSWei Chen close(ndev->tap_fd);
43459ee54ebSWei Chen
43559ee54ebSWei Chen return 0;
43659ee54ebSWei Chen }
43759ee54ebSWei Chen
/* TAP backend tx hook: write the first @out entries of @iov to the TAP fd. */
static inline int tap_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev)
{
	int tap = ndev->tap_fd;

	return writev(tap, iov, out);
}
442b4fdde6dSAsias He
/* TAP backend rx hook: read from the TAP fd into the first @in entries of @iov. */
static inline int tap_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev)
{
	int tap = ndev->tap_fd;

	return readv(tap, iov, in);
}
447b4fdde6dSAsias He
/* User-mode backend tx hook: pass the guest's data to uip_tx(). */
static inline int uip_ops_tx(struct iovec *iov, u16 out, struct net_dev *ndev)
{
	struct uip_info *uip = &ndev->info;

	return uip_tx(iov, out, uip);
}
452b4fdde6dSAsias He
/* User-mode backend rx hook: fetch data for the guest from uip_rx(). */
static inline int uip_ops_rx(struct iovec *iov, u16 in, struct net_dev *ndev)
{
	struct uip_info *uip = &ndev->info;

	return uip_rx(iov, in, uip);
}
457b4fdde6dSAsias He
458b4fdde6dSAsias He static struct net_dev_operations tap_ops = {
459b4fdde6dSAsias He .rx = tap_ops_rx,
460b4fdde6dSAsias He .tx = tap_ops_tx,
461b4fdde6dSAsias He };
462b4fdde6dSAsias He
463b4fdde6dSAsias He static struct net_dev_operations uip_ops = {
464b4fdde6dSAsias He .rx = uip_ops_rx,
465b4fdde6dSAsias He .tx = uip_ops_tx,
466b4fdde6dSAsias He };
467b4fdde6dSAsias He
get_config(struct kvm * kvm,void * dev)468c5ae742bSSasha Levin static u8 *get_config(struct kvm *kvm, void *dev)
46978a2a3e2SSasha Levin {
47078a2a3e2SSasha Levin struct net_dev *ndev = dev;
47178a2a3e2SSasha Levin
472c5ae742bSSasha Levin return ((u8 *)(&ndev->config));
47378a2a3e2SSasha Levin }
47478a2a3e2SSasha Levin
get_config_size(struct kvm * kvm,void * dev)475e4730284SMartin Radev static size_t get_config_size(struct kvm *kvm, void *dev)
476e4730284SMartin Radev {
477e4730284SMartin Radev struct net_dev *ndev = dev;
478e4730284SMartin Radev
479e4730284SMartin Radev return sizeof(ndev->config);
480e4730284SMartin Radev }
481e4730284SMartin Radev
get_host_features(struct kvm * kvm,void * dev)4823c8f82b8SJean-Philippe Brucker static u64 get_host_features(struct kvm *kvm, void *dev)
48378a2a3e2SSasha Levin {
4843c8f82b8SJean-Philippe Brucker u64 features;
48579052597SSasha Levin struct net_dev *ndev = dev;
48679052597SSasha Levin
48759ee54ebSWei Chen features = 1UL << VIRTIO_NET_F_MAC
48878a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_CSUM
48978a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_HOST_TSO4
49078a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_HOST_TSO6
49178a2a3e2SSasha Levin | 1UL << VIRTIO_NET_F_GUEST_TSO4
49292c1f37bSSasha Levin | 1UL << VIRTIO_NET_F_GUEST_TSO6
493754c8ce3SSasha Levin | 1UL << VIRTIO_RING_F_EVENT_IDX
494abd4a801SSasha Levin | 1UL << VIRTIO_RING_F_INDIRECT_DESC
4956585ffb7SSasha Levin | 1UL << VIRTIO_NET_F_CTRL_VQ
4967668c3a6SSasha Levin | 1UL << VIRTIO_NET_F_MRG_RXBUF
4976daffe57SJean-Philippe Brucker | 1UL << (ndev->queue_pairs > 1 ? VIRTIO_NET_F_MQ : 0)
4986daffe57SJean-Philippe Brucker | 1UL << VIRTIO_F_ANY_LAYOUT;
49959ee54ebSWei Chen
50059ee54ebSWei Chen /*
50159ee54ebSWei Chen * The UFO feature for host and guest only can be enabled when the
50259ee54ebSWei Chen * kernel has TAP UFO support.
50359ee54ebSWei Chen */
50459ee54ebSWei Chen if (ndev->tap_ufo)
50559ee54ebSWei Chen features |= (1UL << VIRTIO_NET_F_HOST_UFO
50659ee54ebSWei Chen | 1UL << VIRTIO_NET_F_GUEST_UFO);
50759ee54ebSWei Chen
50853171d59SJean-Philippe Brucker if (ndev->vhost_fd) {
50915636d5eSYing-Shiuan Pan u64 vhost_features;
51015636d5eSYing-Shiuan Pan
51115636d5eSYing-Shiuan Pan if (ioctl(ndev->vhost_fd, VHOST_GET_FEATURES, &vhost_features) != 0)
51215636d5eSYing-Shiuan Pan die_perror("VHOST_GET_FEATURES failed");
51315636d5eSYing-Shiuan Pan
51453171d59SJean-Philippe Brucker features &= vhost_features;
51553171d59SJean-Philippe Brucker }
51653171d59SJean-Philippe Brucker
51753171d59SJean-Philippe Brucker return features;
51853171d59SJean-Philippe Brucker }
51953171d59SJean-Philippe Brucker
virtio_net_start(struct net_dev * ndev)52095242e44SJean-Philippe Brucker static void virtio_net_start(struct net_dev *ndev)
52195242e44SJean-Philippe Brucker {
5223b1cdcf9SJean-Philippe Brucker /* VHOST_NET_F_VIRTIO_NET_HDR clashes with VIRTIO_F_ANY_LAYOUT! */
5233b1cdcf9SJean-Philippe Brucker u64 features = ndev->vdev.features & ~(1UL << VHOST_NET_F_VIRTIO_NET_HDR);
5243b1cdcf9SJean-Philippe Brucker
5258aa155c4SYing-Shiuan Pan if (ndev->mode == NET_MODE_TAP) {
5268aa155c4SYing-Shiuan Pan if (!virtio_net__tap_init(ndev))
52759ee54ebSWei Chen die_perror("TAP device initialized failed because");
52859ee54ebSWei Chen
5293b1cdcf9SJean-Philippe Brucker if (ndev->vhost_fd && virtio_vhost_set_features(ndev->vhost_fd,
5303b1cdcf9SJean-Philippe Brucker features))
53115636d5eSYing-Shiuan Pan die_perror("VHOST_SET_FEATURES failed");
5328aa155c4SYing-Shiuan Pan } else {
533b231683cSJean-Philippe Brucker ndev->info.vnet_hdr_len = virtio_net_hdr_len(ndev);
5348aa155c4SYing-Shiuan Pan uip_init(&ndev->info);
5358aa155c4SYing-Shiuan Pan }
53678a2a3e2SSasha Levin }
53778a2a3e2SSasha Levin
virtio_net_stop(struct net_dev * ndev)53849bada43SJean-Philippe Brucker static void virtio_net_stop(struct net_dev *ndev)
53949bada43SJean-Philippe Brucker {
54049bada43SJean-Philippe Brucker /* Undo whatever start() did */
54149bada43SJean-Philippe Brucker if (ndev->mode == NET_MODE_TAP)
54249bada43SJean-Philippe Brucker virtio_net__tap_exit(ndev);
54349bada43SJean-Philippe Brucker else
54449bada43SJean-Philippe Brucker uip_exit(&ndev->info);
54549bada43SJean-Philippe Brucker }
54649bada43SJean-Philippe Brucker
virtio_net_update_endian(struct net_dev * ndev)547867b15ccSJean-Philippe Brucker static void virtio_net_update_endian(struct net_dev *ndev)
548867b15ccSJean-Philippe Brucker {
549867b15ccSJean-Philippe Brucker struct virtio_net_config *conf = &ndev->config;
550867b15ccSJean-Philippe Brucker
551b17552eeSAndre Przywara conf->status = virtio_host_to_guest_u16(ndev->vdev.endian,
552867b15ccSJean-Philippe Brucker VIRTIO_NET_S_LINK_UP);
553b17552eeSAndre Przywara conf->max_virtqueue_pairs = virtio_host_to_guest_u16(ndev->vdev.endian,
554867b15ccSJean-Philippe Brucker ndev->queue_pairs);
5558b27bcffSJean-Philippe Brucker
5568b27bcffSJean-Philippe Brucker /* Let TAP know about vnet header endianness */
5578b27bcffSJean-Philippe Brucker if (ndev->mode == NET_MODE_TAP &&
5588b27bcffSJean-Philippe Brucker ndev->vdev.endian != VIRTIO_ENDIAN_HOST) {
5598b27bcffSJean-Philippe Brucker int enable_val = 1, disable_val = 0;
5608b27bcffSJean-Philippe Brucker int enable_req, disable_req;
5618b27bcffSJean-Philippe Brucker
5628b27bcffSJean-Philippe Brucker if (ndev->vdev.endian == VIRTIO_ENDIAN_LE) {
5638b27bcffSJean-Philippe Brucker enable_req = TUNSETVNETLE;
5648b27bcffSJean-Philippe Brucker disable_req = TUNSETVNETBE;
5658b27bcffSJean-Philippe Brucker } else {
5668b27bcffSJean-Philippe Brucker enable_req = TUNSETVNETBE;
5678b27bcffSJean-Philippe Brucker disable_req = TUNSETVNETLE;
5688b27bcffSJean-Philippe Brucker }
5698b27bcffSJean-Philippe Brucker
5708b27bcffSJean-Philippe Brucker ioctl(ndev->tap_fd, disable_req, &disable_val);
5718b27bcffSJean-Philippe Brucker if (ioctl(ndev->tap_fd, enable_req, &enable_val) < 0)
5728b27bcffSJean-Philippe Brucker pr_err("Config tap device TUNSETVNETLE/BE error");
5738b27bcffSJean-Philippe Brucker }
574867b15ccSJean-Philippe Brucker }
575867b15ccSJean-Philippe Brucker
/*
 * Status-change hook: refresh endian-dependent state on CONFIG, then start
 * the backend on START, or stop it on STOP when START is not set.
 */
static void notify_status(struct kvm *kvm, void *dev, u32 status)
{
	struct net_dev *ndev = dev;

	if (status & VIRTIO__STATUS_CONFIG)
		virtio_net_update_endian(ndev);

	if (status & VIRTIO__STATUS_START) {
		virtio_net_start(ndev);
		return;
	}

	if (status & VIRTIO__STATUS_STOP)
		virtio_net_stop(ndev);
}
58895242e44SJean-Philippe Brucker
/* The control queue is the one right after all RX/TX pairs. */
static bool is_ctrl_vq(struct net_dev *ndev, u32 vq)
{
	u32 ctrl_index = (u32)(ndev->queue_pairs * 2);

	return vq == ctrl_index;
}
5939e56ec14SSasha Levin
/*
 * Set up virtqueue @vq and start whatever services it.
 *
 * The control queue always gets a worker thread. Data queues get a TX worker
 * (odd index) or an RX worker (even index) unless vhost is in use, in which
 * case the ring is handed to vhost and the TAP fd is set as its backend.
 *
 * Returns 0 on success, or the negated pthread_create() error code when the
 * worker thread cannot be created. A VHOST_NET_SET_BACKEND failure is fatal.
 */
static int init_vq(struct kvm *kvm, void *dev, u32 vq)
{
	struct vhost_vring_file file = { .index = vq };
	struct net_dev_queue *net_queue;
	struct net_dev *ndev = dev;
	struct virt_queue *queue;
	void *(*worker)(void *) = NULL;
	int r;

	compat__remove_message(compat_id);

	net_queue	= &ndev->queues[vq];
	net_queue->id	= vq;
	net_queue->ndev	= ndev;
	queue		= &net_queue->vq;
	virtio_init_device_vq(kvm, &ndev->vdev, queue, VIRTIO_NET_QUEUE_SIZE);

	mutex_init(&net_queue->lock);
	pthread_cond_init(&net_queue->cond, NULL);

	if (is_ctrl_vq(ndev, vq))
		worker = virtio_net_ctrl_thread;
	else if (ndev->vhost_fd == 0)
		worker = (vq & 1) ? virtio_net_tx_thread : virtio_net_rx_thread;

	if (worker) {
		/*
		 * Report a failed spawn: otherwise exit_vq() would later
		 * cancel and join a thread handle that was never set.
		 */
		r = pthread_create(&net_queue->thread, NULL, worker, net_queue);
		if (r) {
			pr_warning("Could not create thread for vq %u (%d)", vq, r);
			return -r;
		}

		return 0;
	}

	virtio_vhost_set_vring(kvm, ndev->vhost_fd, vq, queue);

	file.fd = ndev->tap_fd;
	r = ioctl(ndev->vhost_fd, VHOST_NET_SET_BACKEND, &file);
	if (r < 0)
		die_perror("VHOST_NET_SET_BACKEND failed");

	return 0;
}
6379ed67cdcSSasha Levin
/*
 * Tear down virtqueue @vq of the net device @dev.
 *
 * The vring is reset first. Userspace-serviced queues then have their worker
 * thread cancelled and joined; vhost data queues can only be stopped by
 * resetting the vhost owner.
 */
static void exit_vq(struct kvm *kvm, void *dev, u32 vq)
{
	struct net_dev *ndev = dev;
	struct net_dev_queue *net_queue = &ndev->queues[vq];
	bool vhost_data_queue;

	virtio_vhost_reset_vring(kvm, ndev->vhost_fd, vq, &net_queue->vq);

	vhost_data_queue = ndev->vhost_fd && !is_ctrl_vq(ndev, vq);
	if (!vhost_data_queue) {
		/*
		 * Threads are waiting on cancellation points (readv or
		 * pthread_cond_wait) and should stop gracefully.
		 */
		pthread_cancel(net_queue->thread);
		pthread_join(net_queue->thread, NULL);
		return;
	}

	/*
	 * TODO: vhost reset owner. It's the only way to cleanly stop vhost, but
	 * we can't restart it at the moment.
	 */
	pr_warning("Cannot reset VHOST queue");
	ioctl(ndev->vhost_fd, VHOST_RESET_OWNER);
}
66249bada43SJean-Philippe Brucker
/*
 * Bind interrupt line @gsi to virtqueue @vq as a vhost irqfd.
 * Does nothing when vhost is not in use or @vq is the control queue.
 */
static void notify_vq_gsi(struct kvm *kvm, void *dev, u32 vq, u32 gsi)
{
	struct net_dev *ndev = dev;

	if (ndev->vhost_fd != 0 && !is_ctrl_vq(ndev, vq))
		virtio_vhost_set_vring_irqfd(kvm, gsi, &ndev->queues[vq].vq);
}
6739ed67cdcSSasha Levin
/*
 * Register eventfd @efd as the vhost kick for virtqueue @vq.
 * Does nothing when vhost is not in use or @vq is the control queue.
 */
static void notify_vq_eventfd(struct kvm *kvm, void *dev, u32 vq, u32 efd)
{
	struct net_dev *ndev = dev;

	if (ndev->vhost_fd != 0 && !is_ctrl_vq(ndev, vq))
		virtio_vhost_set_vring_kick(kvm, ndev->vhost_fd, vq, efd);
}
68378a2a3e2SSasha Levin
/*
 * Guest notification for virtqueue @vq: forward it to the net device's
 * callback handler. Always returns 0.
 */
static int notify_vq(struct kvm *kvm, void *dev, u32 vq)
{
	/* @dev is the struct net_dev registered with virtio_init(). */
	virtio_net_handle_callback(kvm, dev, vq);

	return 0;
}
69278a2a3e2SSasha Levin
/* Return the virt_queue embedded in the device's queue slot @vq. */
static struct virt_queue *get_vq(struct kvm *kvm, void *dev, u32 vq)
{
	struct net_dev *ndev = dev;
	struct net_dev_queue *net_queue = &ndev->queues[vq];

	return &net_queue->vq;
}
69978a2a3e2SSasha Levin
/*
 * Report the size of virtqueue @vq. Every queue currently has the same
 * fixed size.
 */
static int get_size_vq(struct kvm *kvm, void *dev, u32 vq)
{
	/* FIXME: dynamic */
	const int queue_size = VIRTIO_NET_QUEUE_SIZE;

	return queue_size;
}
70578a2a3e2SSasha Levin
/*
 * Accept a queue size requested for virtqueue @vq. The value is not stored;
 * @size is simply echoed back to the caller.
 */
static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, int size)
{
	/* FIXME: dynamic */
	int accepted = size;

	return accepted;
}
7110f4f51a8SAsias He
get_vq_count(struct kvm * kvm,void * dev)71231e0eaccSMartin Radev static unsigned int get_vq_count(struct kvm *kvm, void *dev)
713b98ac591SJean-Philippe Brucker {
714b98ac591SJean-Philippe Brucker struct net_dev *ndev = dev;
715b98ac591SJean-Philippe Brucker
716b98ac591SJean-Philippe Brucker return ndev->queue_pairs * 2 + 1;
717b98ac591SJean-Philippe Brucker }
718b98ac591SJean-Philippe Brucker
71915542babSAndre Przywara static struct virtio_ops net_dev_virtio_ops = {
7201c47ce69SSasha Levin .get_config = get_config,
721e4730284SMartin Radev .get_config_size = get_config_size,
7221c47ce69SSasha Levin .get_host_features = get_host_features,
723b98ac591SJean-Philippe Brucker .get_vq_count = get_vq_count,
7241c47ce69SSasha Levin .init_vq = init_vq,
72549bada43SJean-Philippe Brucker .exit_vq = exit_vq,
72653fbb17bSJean-Philippe Brucker .get_vq = get_vq,
7271c47ce69SSasha Levin .get_size_vq = get_size_vq,
7280f4f51a8SAsias He .set_size_vq = set_size_vq,
7290f4f51a8SAsias He .notify_vq = notify_vq,
7309ed67cdcSSasha Levin .notify_vq_gsi = notify_vq_gsi,
7319ed67cdcSSasha Levin .notify_vq_eventfd = notify_vq_eventfd,
73295242e44SJean-Philippe Brucker .notify_status = notify_status,
7331c47ce69SSasha Levin };
7341c47ce69SSasha Levin
virtio_net__vhost_init(struct kvm * kvm,struct net_dev * ndev)7359ed67cdcSSasha Levin static void virtio_net__vhost_init(struct kvm *kvm, struct net_dev *ndev)
7369ed67cdcSSasha Levin {
7373a70ab1eSJean-Philippe Brucker if (ndev->queue_pairs > 1) {
7383a70ab1eSJean-Philippe Brucker pr_warning("multiqueue is not supported with vhost yet");
7393a70ab1eSJean-Philippe Brucker return;
7403a70ab1eSJean-Philippe Brucker }
7413a70ab1eSJean-Philippe Brucker
7429ed67cdcSSasha Levin ndev->vhost_fd = open("/dev/vhost-net", O_RDWR);
7439ed67cdcSSasha Levin if (ndev->vhost_fd < 0)
7449ed67cdcSSasha Levin die_perror("Failed openning vhost-net device");
7459ed67cdcSSasha Levin
746f84ab9ebSJean-Philippe Brucker virtio_vhost_init(kvm, ndev->vhost_fd);
747627d6874SAsias He
748627d6874SAsias He ndev->vdev.use_vhost = true;
7499ed67cdcSSasha Levin }
7509ed67cdcSSasha Levin
/*
 * Parse a MAC address written as six colon-separated hex octets
 * ("aa:bb:cc:dd:ee:ff") from @str into the 6-byte buffer @mac.
 *
 * @mac is only written when all six octets parse; a NULL or malformed @str
 * leaves it untouched, so a caller-provided default is never half-overwritten.
 */
static inline void str_to_mac(const char *str, char *mac)
{
	/* %hhx stores through an unsigned char pointer. */
	unsigned char octets[6];
	unsigned char *out = (unsigned char *)mac;
	int i;

	if (str == NULL)
		return;

	if (sscanf(str, "%hhx:%hhx:%hhx:%hhx:%hhx:%hhx",
		   &octets[0], &octets[1], &octets[2],
		   &octets[3], &octets[4], &octets[5]) != 6)
		return;

	for (i = 0; i < 6; i++)
		out[i] = octets[i];
}
set_net_param(struct kvm * kvm,struct virtio_net_params * p,const char * param,const char * val)7564346fd8fSSasha Levin static int set_net_param(struct kvm *kvm, struct virtio_net_params *p,
7574346fd8fSSasha Levin const char *param, const char *val)
7585f225124SSasha Levin {
7595f225124SSasha Levin if (strcmp(param, "guest_mac") == 0) {
7605f225124SSasha Levin str_to_mac(val, p->guest_mac);
7615f225124SSasha Levin } else if (strcmp(param, "mode") == 0) {
7625f225124SSasha Levin if (!strncmp(val, "user", 4)) {
7635f225124SSasha Levin int i;
7645f225124SSasha Levin
7655f225124SSasha Levin for (i = 0; i < kvm->cfg.num_net_devices; i++)
7665f225124SSasha Levin if (kvm->cfg.net_params[i].mode == NET_MODE_USER)
7675f225124SSasha Levin die("Only one usermode network device allowed at a time");
7685f225124SSasha Levin p->mode = NET_MODE_USER;
7695f225124SSasha Levin } else if (!strncmp(val, "tap", 3)) {
7705f225124SSasha Levin p->mode = NET_MODE_TAP;
7715f225124SSasha Levin } else if (!strncmp(val, "none", 4)) {
7725f225124SSasha Levin kvm->cfg.no_net = 1;
7735f225124SSasha Levin return -1;
7745f225124SSasha Levin } else
7755f225124SSasha Levin die("Unknown network mode %s, please use user, tap or none", kvm->cfg.network);
7765f225124SSasha Levin } else if (strcmp(param, "script") == 0) {
7775f225124SSasha Levin p->script = strdup(val);
778eef27ae3SFan Du } else if (strcmp(param, "downscript") == 0) {
779eef27ae3SFan Du p->downscript = strdup(val);
7805f225124SSasha Levin } else if (strcmp(param, "guest_ip") == 0) {
7815f225124SSasha Levin p->guest_ip = strdup(val);
7825f225124SSasha Levin } else if (strcmp(param, "host_ip") == 0) {
7835f225124SSasha Levin p->host_ip = strdup(val);
7845f225124SSasha Levin } else if (strcmp(param, "trans") == 0) {
7855f225124SSasha Levin p->trans = strdup(val);
7861dfc7c24SMarc Zyngier } else if (strcmp(param, "tapif") == 0) {
7871dfc7c24SMarc Zyngier p->tapif = strdup(val);
7885f225124SSasha Levin } else if (strcmp(param, "vhost") == 0) {
7895f225124SSasha Levin p->vhost = atoi(val);
7905f225124SSasha Levin } else if (strcmp(param, "fd") == 0) {
7915f225124SSasha Levin p->fd = atoi(val);
79279052597SSasha Levin } else if (strcmp(param, "mq") == 0) {
79379052597SSasha Levin p->mq = atoi(val);
7945f225124SSasha Levin } else
7955f225124SSasha Levin die("Unknown network parameter %s", param);
7965f225124SSasha Levin
7975f225124SSasha Levin return 0;
7985f225124SSasha Levin }
7995f225124SSasha Levin
netdev_parser(const struct option * opt,const char * arg,int unset)8005f225124SSasha Levin int netdev_parser(const struct option *opt, const char *arg, int unset)
8015f225124SSasha Levin {
8025f225124SSasha Levin struct virtio_net_params p;
8035f225124SSasha Levin char *buf = NULL, *cmd = NULL, *cur = NULL;
8045f225124SSasha Levin bool on_cmd = true;
8055f225124SSasha Levin struct kvm *kvm = opt->ptr;
8065f225124SSasha Levin
8075f225124SSasha Levin if (arg) {
8085f225124SSasha Levin buf = strdup(arg);
8095f225124SSasha Levin if (buf == NULL)
8105f225124SSasha Levin die("Failed allocating new net buffer");
8115f225124SSasha Levin cur = strtok(buf, ",=");
8125f225124SSasha Levin }
8135f225124SSasha Levin
8145f225124SSasha Levin p = (struct virtio_net_params) {
8155f225124SSasha Levin .guest_ip = DEFAULT_GUEST_ADDR,
8165f225124SSasha Levin .host_ip = DEFAULT_HOST_ADDR,
8175f225124SSasha Levin .script = DEFAULT_SCRIPT,
818eef27ae3SFan Du .downscript = DEFAULT_SCRIPT,
8195f225124SSasha Levin .mode = NET_MODE_TAP,
8205f225124SSasha Levin };
8215f225124SSasha Levin
8225f225124SSasha Levin str_to_mac(DEFAULT_GUEST_MAC, p.guest_mac);
8235f225124SSasha Levin p.guest_mac[5] += kvm->cfg.num_net_devices;
8245f225124SSasha Levin
8255f225124SSasha Levin while (cur) {
8265f225124SSasha Levin if (on_cmd) {
8275f225124SSasha Levin cmd = cur;
8285f225124SSasha Levin } else {
8294346fd8fSSasha Levin if (set_net_param(kvm, &p, cmd, cur) < 0)
8305f225124SSasha Levin goto done;
8315f225124SSasha Levin }
8325f225124SSasha Levin on_cmd = !on_cmd;
8335f225124SSasha Levin
8345f225124SSasha Levin cur = strtok(NULL, ",=");
8355f225124SSasha Levin };
8365f225124SSasha Levin
8375f225124SSasha Levin kvm->cfg.num_net_devices++;
8385f225124SSasha Levin
8395f225124SSasha Levin kvm->cfg.net_params = realloc(kvm->cfg.net_params, kvm->cfg.num_net_devices * sizeof(*kvm->cfg.net_params));
8405f225124SSasha Levin if (kvm->cfg.net_params == NULL)
8415f225124SSasha Levin die("Failed adding new network device");
8425f225124SSasha Levin
8435f225124SSasha Levin kvm->cfg.net_params[kvm->cfg.num_net_devices - 1] = p;
8445f225124SSasha Levin
8455f225124SSasha Levin done:
8465f225124SSasha Levin free(buf);
8475f225124SSasha Levin return 0;
8485f225124SSasha Levin }
8495f225124SSasha Levin
virtio_net__init_one(struct virtio_net_params * params)8504498eb74SAlexandru Elisei static int virtio_net__init_one(struct virtio_net_params *params)
8514f56d42cSAsias He {
8529b46ebc5SRajnesh Kanwal enum virtio_trans trans = params->kvm->cfg.virtio_transport;
8539a6d73f1SSasha Levin struct net_dev *ndev;
85476a4aac6SWill Deacon struct virtio_ops *ops;
8559b46ebc5SRajnesh Kanwal int i, r;
8569a6d73f1SSasha Levin
8579a6d73f1SSasha Levin ndev = calloc(1, sizeof(struct net_dev));
8589a6d73f1SSasha Levin if (ndev == NULL)
8595f225124SSasha Levin return -ENOMEM;
8609a6d73f1SSasha Levin
8619a6d73f1SSasha Levin list_add_tail(&ndev->list, &ndevs);
8629a6d73f1SSasha Levin
863db927775SAlexandru Elisei ops = malloc(sizeof(*ops));
864db927775SAlexandru Elisei if (ops == NULL)
865db927775SAlexandru Elisei return -ENOMEM;
866db927775SAlexandru Elisei
8679a6d73f1SSasha Levin ndev->kvm = params->kvm;
8688c0ae74dSSasha Levin ndev->params = params;
8699a6d73f1SSasha Levin
8709a6d73f1SSasha Levin mutex_init(&ndev->mutex);
87179052597SSasha Levin ndev->queue_pairs = max(1, min(VIRTIO_NET_NUM_QUEUES, params->mq));
87279052597SSasha Levin
8730c54698eSAsias He for (i = 0 ; i < 6 ; i++) {
8749a6d73f1SSasha Levin ndev->config.mac[i] = params->guest_mac[i];
8759a6d73f1SSasha Levin ndev->info.guest_mac.addr[i] = params->guest_mac[i];
8769a6d73f1SSasha Levin ndev->info.host_mac.addr[i] = params->host_mac[i];
8770c54698eSAsias He }
878f715177dSAsias He
8799a6d73f1SSasha Levin ndev->mode = params->mode;
8809a6d73f1SSasha Levin if (ndev->mode == NET_MODE_TAP) {
8819a6d73f1SSasha Levin ndev->ops = &tap_ops;
88259ee54ebSWei Chen if (!virtio_net__tap_create(ndev))
88359ee54ebSWei Chen die_perror("You have requested a TAP device, but creation of one has failed because");
884b4fdde6dSAsias He } else {
8859a6d73f1SSasha Levin ndev->info.host_ip = ntohl(inet_addr(params->host_ip));
8869a6d73f1SSasha Levin ndev->info.guest_ip = ntohl(inet_addr(params->guest_ip));
8879a6d73f1SSasha Levin ndev->info.guest_netmask = ntohl(inet_addr("255.255.255.0"));
8889a6d73f1SSasha Levin ndev->info.buf_nr = 20,
8899a6d73f1SSasha Levin ndev->ops = &uip_ops;
8905f3aaf22SMarc Zyngier uip_static_init(&ndev->info);
891b4fdde6dSAsias He }
892b5ee1ea7SAsias He
89376a4aac6SWill Deacon *ops = net_dev_virtio_ops;
894dc7a55d6SSuzuki K. Poulose
895dc7a55d6SSuzuki K. Poulose if (params->trans) {
896dc7a55d6SSuzuki K. Poulose if (strcmp(params->trans, "mmio") == 0)
897dc7a55d6SSuzuki K. Poulose trans = VIRTIO_MMIO;
898dc7a55d6SSuzuki K. Poulose else if (strcmp(params->trans, "pci") == 0)
899dc7a55d6SSuzuki K. Poulose trans = VIRTIO_PCI;
90069205aa1SAsias He else
901dc7a55d6SSuzuki K. Poulose pr_warning("virtio-net: Unknown transport method : %s, "
902dc7a55d6SSuzuki K. Poulose "falling back to %s.", params->trans,
903dc7a55d6SSuzuki K. Poulose virtio_trans_name(trans));
904dc7a55d6SSuzuki K. Poulose }
905dc7a55d6SSuzuki K. Poulose
906db927775SAlexandru Elisei r = virtio_init(params->kvm, ndev, &ndev->vdev, ops, trans,
90776a4aac6SWill Deacon PCI_DEVICE_ID_VIRTIO_NET, VIRTIO_ID_NET, PCI_CLASS_NET);
908db927775SAlexandru Elisei if (r < 0) {
909db927775SAlexandru Elisei free(ops);
910db927775SAlexandru Elisei return r;
911db927775SAlexandru Elisei }
91227ab67f5SSasha Levin
9139ed67cdcSSasha Levin if (params->vhost)
9149ed67cdcSSasha Levin virtio_net__vhost_init(params->kvm, ndev);
915cb83de6fSSasha Levin
9164498eb74SAlexandru Elisei if (compat_id == -1)
91752f34d2cSAsias He compat_id = virtio_compat_add_message("virtio-net", "CONFIG_VIRTIO_NET");
9185f225124SSasha Levin
9195f225124SSasha Levin return 0;
9205f225124SSasha Levin }
9215f225124SSasha Levin
virtio_net__init(struct kvm * kvm)9225f225124SSasha Levin int virtio_net__init(struct kvm *kvm)
9235f225124SSasha Levin {
924db927775SAlexandru Elisei int i, r;
9255f225124SSasha Levin
9265f225124SSasha Levin for (i = 0; i < kvm->cfg.num_net_devices; i++) {
9275f225124SSasha Levin kvm->cfg.net_params[i].kvm = kvm;
9284498eb74SAlexandru Elisei r = virtio_net__init_one(&kvm->cfg.net_params[i]);
929db927775SAlexandru Elisei if (r < 0)
930db927775SAlexandru Elisei goto cleanup;
9315f225124SSasha Levin }
9325f225124SSasha Levin
9335f225124SSasha Levin if (kvm->cfg.num_net_devices == 0 && kvm->cfg.no_net == 0) {
9348c0ae74dSSasha Levin static struct virtio_net_params net_params;
9355f225124SSasha Levin
9365f225124SSasha Levin net_params = (struct virtio_net_params) {
9375f225124SSasha Levin .guest_ip = kvm->cfg.guest_ip,
9385f225124SSasha Levin .host_ip = kvm->cfg.host_ip,
9395f225124SSasha Levin .kvm = kvm,
9405f225124SSasha Levin .script = kvm->cfg.script,
9415f225124SSasha Levin .mode = NET_MODE_USER,
9425f225124SSasha Levin };
9435f225124SSasha Levin str_to_mac(kvm->cfg.guest_mac, net_params.guest_mac);
9445f225124SSasha Levin str_to_mac(kvm->cfg.host_mac, net_params.host_mac);
9455f225124SSasha Levin
9464498eb74SAlexandru Elisei r = virtio_net__init_one(&net_params);
947db927775SAlexandru Elisei if (r < 0)
948db927775SAlexandru Elisei goto cleanup;
9495f225124SSasha Levin }
9505f225124SSasha Levin
9515f225124SSasha Levin return 0;
952db927775SAlexandru Elisei
953db927775SAlexandru Elisei cleanup:
954db927775SAlexandru Elisei virtio_net__exit(kvm);
955db927775SAlexandru Elisei return r;
9565f225124SSasha Levin }
95749a8afd1SSasha Levin virtio_dev_init(virtio_net__init);
9585f225124SSasha Levin
virtio_net__exit(struct kvm * kvm)9595f225124SSasha Levin int virtio_net__exit(struct kvm *kvm)
9605f225124SSasha Levin {
961eef27ae3SFan Du struct virtio_net_params *params;
962eef27ae3SFan Du struct net_dev *ndev;
963db927775SAlexandru Elisei struct list_head *ptr, *n;
964eef27ae3SFan Du
965db927775SAlexandru Elisei list_for_each_safe(ptr, n, &ndevs) {
966eef27ae3SFan Du ndev = list_entry(ptr, struct net_dev, list);
967eef27ae3SFan Du params = ndev->params;
968eef27ae3SFan Du /* Cleanup any tap device which attached to bridge */
969eef27ae3SFan Du if (ndev->mode == NET_MODE_TAP &&
970eef27ae3SFan Du strcmp(params->downscript, "none"))
971eef27ae3SFan Du virtio_net_exec_script(params->downscript, ndev->tap_name);
972*74af1456SEduardo Bart virtio_net_stop(ndev);
973db927775SAlexandru Elisei
974db927775SAlexandru Elisei list_del(&ndev->list);
975*74af1456SEduardo Bart virtio_exit(kvm, &ndev->vdev);
976db927775SAlexandru Elisei free(ndev);
977eef27ae3SFan Du }
978*74af1456SEduardo Bart
9795f225124SSasha Levin return 0;
9804f56d42cSAsias He }
98149a8afd1SSasha Levin virtio_dev_exit(virtio_net__exit);
982