1e263cd49SDmitry Fleytman /* 2605d52e6SDmitry Fleytman * QEMU TX packets abstractions 3e263cd49SDmitry Fleytman * 4e263cd49SDmitry Fleytman * Copyright (c) 2012 Ravello Systems LTD (http://ravellosystems.com) 5e263cd49SDmitry Fleytman * 6e263cd49SDmitry Fleytman * Developed by Daynix Computing LTD (http://www.daynix.com) 7e263cd49SDmitry Fleytman * 8e263cd49SDmitry Fleytman * Authors: 9e263cd49SDmitry Fleytman * Dmitry Fleytman <dmitry@daynix.com> 10e263cd49SDmitry Fleytman * Tamir Shomer <tamirs@daynix.com> 11e263cd49SDmitry Fleytman * Yan Vugenfirer <yan@daynix.com> 12e263cd49SDmitry Fleytman * 13e263cd49SDmitry Fleytman * This work is licensed under the terms of the GNU GPL, version 2 or later. 14e263cd49SDmitry Fleytman * See the COPYING file in the top-level directory. 15e263cd49SDmitry Fleytman * 16e263cd49SDmitry Fleytman */ 17e263cd49SDmitry Fleytman 18e9abfcb5SPaolo Bonzini #include "qemu/osdep.h" 19605d52e6SDmitry Fleytman #include "net_tx_pkt.h" 20e263cd49SDmitry Fleytman #include "net/eth.h" 21e263cd49SDmitry Fleytman #include "net/checksum.h" 22e263cd49SDmitry Fleytman #include "net/tap.h" 23e263cd49SDmitry Fleytman #include "net/net.h" 24edf5ca5dSMarkus Armbruster #include "hw/pci/pci_device.h" 25e263cd49SDmitry Fleytman 26e263cd49SDmitry Fleytman enum { 27605d52e6SDmitry Fleytman NET_TX_PKT_VHDR_FRAG = 0, 28605d52e6SDmitry Fleytman NET_TX_PKT_L2HDR_FRAG, 29605d52e6SDmitry Fleytman NET_TX_PKT_L3HDR_FRAG, 30605d52e6SDmitry Fleytman NET_TX_PKT_PL_START_FRAG 31e263cd49SDmitry Fleytman }; 32e263cd49SDmitry Fleytman 33e263cd49SDmitry Fleytman /* TX packet private context */ 34605d52e6SDmitry Fleytman struct NetTxPkt { 3511171010SDmitry Fleytman PCIDevice *pci_dev; 3611171010SDmitry Fleytman 37e263cd49SDmitry Fleytman struct virtio_net_hdr virt_hdr; 38e263cd49SDmitry Fleytman 39e263cd49SDmitry Fleytman struct iovec *raw; 40e263cd49SDmitry Fleytman uint32_t raw_frags; 41e263cd49SDmitry Fleytman uint32_t max_raw_frags; 42e263cd49SDmitry Fleytman 43e263cd49SDmitry Fleytman struct iovec *vec; 44e263cd49SDmitry Fleytman 45e263cd49SDmitry Fleytman uint8_t l2_hdr[ETH_MAX_L2_HDR_LEN]; 462a5f744eSAkihiko Odaki union { 472a5f744eSAkihiko Odaki struct ip_header ip; 482a5f744eSAkihiko Odaki struct ip6_header ip6; 492a5f744eSAkihiko Odaki uint8_t octets[ETH_MAX_IP_DGRAM_LEN]; 502a5f744eSAkihiko Odaki } l3_hdr; 51e263cd49SDmitry Fleytman 52e263cd49SDmitry Fleytman uint32_t payload_len; 53e263cd49SDmitry Fleytman 54e263cd49SDmitry Fleytman uint32_t payload_frags; 55e263cd49SDmitry Fleytman uint32_t max_payload_frags; 56e263cd49SDmitry Fleytman 57e263cd49SDmitry Fleytman uint16_t hdr_len; 58e263cd49SDmitry Fleytman eth_pkt_types_e packet_type; 59e263cd49SDmitry Fleytman uint8_t l4proto; 60e263cd49SDmitry Fleytman }; 61e263cd49SDmitry Fleytman 6211171010SDmitry Fleytman void net_tx_pkt_init(struct NetTxPkt **pkt, PCIDevice *pci_dev, 6355daf493SAkihiko Odaki uint32_t max_frags) 64e263cd49SDmitry Fleytman { 65605d52e6SDmitry Fleytman struct NetTxPkt *p = g_malloc0(sizeof *p); 66e263cd49SDmitry Fleytman 6711171010SDmitry Fleytman p->pci_dev = pci_dev; 6811171010SDmitry Fleytman 6947882fa4SLi Qiang p->vec = g_new(struct iovec, max_frags + NET_TX_PKT_PL_START_FRAG); 70e263cd49SDmitry Fleytman 7147882fa4SLi Qiang p->raw = g_new(struct iovec, max_frags); 72e263cd49SDmitry Fleytman 73e263cd49SDmitry Fleytman p->max_payload_frags = max_frags; 74e263cd49SDmitry Fleytman p->max_raw_frags = max_frags; 75605d52e6SDmitry Fleytman p->vec[NET_TX_PKT_VHDR_FRAG].iov_base = &p->virt_hdr; 7655daf493SAkihiko Odaki p->vec[NET_TX_PKT_VHDR_FRAG].iov_len = sizeof p->virt_hdr; 77605d52e6SDmitry Fleytman p->vec[NET_TX_PKT_L2HDR_FRAG].iov_base = &p->l2_hdr; 78eb700029SDmitry Fleytman p->vec[NET_TX_PKT_L3HDR_FRAG].iov_base = &p->l3_hdr; 79e263cd49SDmitry Fleytman 80e263cd49SDmitry Fleytman *pkt = p; 81e263cd49SDmitry Fleytman } 82e263cd49SDmitry Fleytman 83605d52e6SDmitry Fleytman void net_tx_pkt_uninit(struct NetTxPkt *pkt) 84e263cd49SDmitry Fleytman { 85e263cd49SDmitry Fleytman if (pkt) { 86e263cd49SDmitry Fleytman g_free(pkt->vec); 87e263cd49SDmitry Fleytman g_free(pkt->raw); 88e263cd49SDmitry Fleytman g_free(pkt); 89e263cd49SDmitry Fleytman } 90e263cd49SDmitry Fleytman } 91e263cd49SDmitry Fleytman 92eb700029SDmitry Fleytman void net_tx_pkt_update_ip_hdr_checksum(struct NetTxPkt *pkt) 93eb700029SDmitry Fleytman { 94eb700029SDmitry Fleytman uint16_t csum; 95eb700029SDmitry Fleytman assert(pkt); 96eb700029SDmitry Fleytman 972a5f744eSAkihiko Odaki pkt->l3_hdr.ip.ip_len = cpu_to_be16(pkt->payload_len + 98eb700029SDmitry Fleytman pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_len); 99eb700029SDmitry Fleytman 1002a5f744eSAkihiko Odaki pkt->l3_hdr.ip.ip_sum = 0; 1012a5f744eSAkihiko Odaki csum = net_raw_checksum(pkt->l3_hdr.octets, 102eb700029SDmitry Fleytman pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_len); 1032a5f744eSAkihiko Odaki pkt->l3_hdr.ip.ip_sum = cpu_to_be16(csum); 104eb700029SDmitry Fleytman } 105eb700029SDmitry Fleytman 106605d52e6SDmitry Fleytman void net_tx_pkt_update_ip_checksums(struct NetTxPkt *pkt) 107e263cd49SDmitry Fleytman { 108e263cd49SDmitry Fleytman uint16_t csum; 109eb700029SDmitry Fleytman uint32_t cntr, cso; 110e263cd49SDmitry Fleytman assert(pkt); 111e263cd49SDmitry Fleytman uint8_t gso_type = pkt->virt_hdr.gso_type & ~VIRTIO_NET_HDR_GSO_ECN; 112eb700029SDmitry Fleytman void *ip_hdr = pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_base; 113e263cd49SDmitry Fleytman 114605d52e6SDmitry Fleytman if (pkt->payload_len + pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_len > 115e263cd49SDmitry Fleytman ETH_MAX_IP_DGRAM_LEN) { 116e263cd49SDmitry Fleytman return; 117e263cd49SDmitry Fleytman } 118e263cd49SDmitry Fleytman 119eb700029SDmitry Fleytman if (gso_type == VIRTIO_NET_HDR_GSO_TCPV4 || 120eb700029SDmitry Fleytman gso_type == VIRTIO_NET_HDR_GSO_UDP) { 121e263cd49SDmitry Fleytman /* Calculate IP header checksum */ 122eb700029SDmitry Fleytman net_tx_pkt_update_ip_hdr_checksum(pkt); 123e263cd49SDmitry Fleytman 124e263cd49SDmitry Fleytman /* Calculate IP pseudo header checksum */ 125eb700029SDmitry Fleytman cntr = eth_calc_ip4_pseudo_hdr_csum(ip_hdr, pkt->payload_len, &cso); 126eb700029SDmitry Fleytman csum = cpu_to_be16(~net_checksum_finish(cntr)); 127eb700029SDmitry Fleytman } else if (gso_type == VIRTIO_NET_HDR_GSO_TCPV6) { 128eb700029SDmitry Fleytman /* Calculate IP pseudo header checksum */ 129eb700029SDmitry Fleytman cntr = eth_calc_ip6_pseudo_hdr_csum(ip_hdr, pkt->payload_len, 130eb700029SDmitry Fleytman IP_PROTO_TCP, &cso); 131eb700029SDmitry Fleytman csum = cpu_to_be16(~net_checksum_finish(cntr)); 132eb700029SDmitry Fleytman } else { 133eb700029SDmitry Fleytman return; 134eb700029SDmitry Fleytman } 135eb700029SDmitry Fleytman 136605d52e6SDmitry Fleytman iov_from_buf(&pkt->vec[NET_TX_PKT_PL_START_FRAG], pkt->payload_frags, 137e263cd49SDmitry Fleytman pkt->virt_hdr.csum_offset, &csum, sizeof(csum)); 138e263cd49SDmitry Fleytman } 139e263cd49SDmitry Fleytman 140605d52e6SDmitry Fleytman static void net_tx_pkt_calculate_hdr_len(struct NetTxPkt *pkt) 141e263cd49SDmitry Fleytman { 142605d52e6SDmitry Fleytman pkt->hdr_len = pkt->vec[NET_TX_PKT_L2HDR_FRAG].iov_len + 143605d52e6SDmitry Fleytman pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_len; 144e263cd49SDmitry Fleytman } 145e263cd49SDmitry Fleytman 146605d52e6SDmitry Fleytman static bool net_tx_pkt_parse_headers(struct NetTxPkt *pkt) 147e263cd49SDmitry Fleytman { 148e263cd49SDmitry Fleytman struct iovec *l2_hdr, *l3_hdr; 149e263cd49SDmitry Fleytman size_t bytes_read; 150e263cd49SDmitry Fleytman size_t full_ip6hdr_len; 151e263cd49SDmitry Fleytman uint16_t l3_proto; 152e263cd49SDmitry Fleytman 153e263cd49SDmitry Fleytman assert(pkt); 154e263cd49SDmitry Fleytman 155605d52e6SDmitry Fleytman l2_hdr = &pkt->vec[NET_TX_PKT_L2HDR_FRAG]; 156605d52e6SDmitry Fleytman l3_hdr = &pkt->vec[NET_TX_PKT_L3HDR_FRAG]; 157e263cd49SDmitry Fleytman 158e263cd49SDmitry Fleytman bytes_read = iov_to_buf(pkt->raw, pkt->raw_frags, 0, l2_hdr->iov_base, 159e263cd49SDmitry Fleytman ETH_MAX_L2_HDR_LEN); 160a7278b36SDana Rubin if (bytes_read < sizeof(struct eth_header)) { 161e263cd49SDmitry Fleytman l2_hdr->iov_len = 0; 162e263cd49SDmitry Fleytman return false; 163a7278b36SDana Rubin } 164a7278b36SDana Rubin 165a7278b36SDana Rubin l2_hdr->iov_len = sizeof(struct eth_header); 166a7278b36SDana Rubin switch (be16_to_cpu(PKT_GET_ETH_HDR(l2_hdr->iov_base)->h_proto)) { 167a7278b36SDana Rubin case ETH_P_VLAN: 168a7278b36SDana Rubin l2_hdr->iov_len += sizeof(struct vlan_header); 169a7278b36SDana Rubin break; 170a7278b36SDana Rubin case ETH_P_DVLAN: 171a7278b36SDana Rubin l2_hdr->iov_len += 2 * sizeof(struct vlan_header); 172a7278b36SDana Rubin break; 173a7278b36SDana Rubin } 174a7278b36SDana Rubin 175a7278b36SDana Rubin if (bytes_read < l2_hdr->iov_len) { 176a7278b36SDana Rubin l2_hdr->iov_len = 0; 177eb700029SDmitry Fleytman l3_hdr->iov_len = 0; 178eb700029SDmitry Fleytman pkt->packet_type = ETH_PKT_UCAST; 179a7278b36SDana Rubin return false; 180eb700029SDmitry Fleytman } else { 181eb700029SDmitry Fleytman l2_hdr->iov_len = ETH_MAX_L2_HDR_LEN; 182eb700029SDmitry Fleytman l2_hdr->iov_len = eth_get_l2_hdr_length(l2_hdr->iov_base); 183eb700029SDmitry Fleytman pkt->packet_type = get_eth_packet_type(l2_hdr->iov_base); 184e263cd49SDmitry Fleytman } 185e263cd49SDmitry Fleytman 186eb700029SDmitry Fleytman l3_proto = eth_get_l3_proto(l2_hdr, 1, l2_hdr->iov_len); 187e263cd49SDmitry Fleytman 188e263cd49SDmitry Fleytman switch (l3_proto) { 189e263cd49SDmitry Fleytman case ETH_P_IP: 190e263cd49SDmitry Fleytman bytes_read = iov_to_buf(pkt->raw, pkt->raw_frags, l2_hdr->iov_len, 191e263cd49SDmitry Fleytman l3_hdr->iov_base, sizeof(struct ip_header)); 192e263cd49SDmitry Fleytman 193e263cd49SDmitry Fleytman if (bytes_read < sizeof(struct ip_header)) { 194e263cd49SDmitry Fleytman l3_hdr->iov_len = 0; 195e263cd49SDmitry Fleytman return false; 196e263cd49SDmitry Fleytman } 197e263cd49SDmitry Fleytman 198e263cd49SDmitry Fleytman l3_hdr->iov_len = IP_HDR_GET_LEN(l3_hdr->iov_base); 199eb700029SDmitry Fleytman 200eb700029SDmitry Fleytman if (l3_hdr->iov_len < sizeof(struct ip_header)) { 201eb700029SDmitry Fleytman l3_hdr->iov_len = 0; 202eb700029SDmitry Fleytman return false; 203eb700029SDmitry Fleytman } 204eb700029SDmitry Fleytman 2054f51e1d3SMarc-André Lureau pkt->l4proto = IP_HDR_GET_P(l3_hdr->iov_base); 206e263cd49SDmitry Fleytman 207eb700029SDmitry Fleytman if (IP_HDR_GET_LEN(l3_hdr->iov_base) != sizeof(struct ip_header)) { 208eb700029SDmitry Fleytman /* copy optional IPv4 header data if any*/ 209e263cd49SDmitry Fleytman bytes_read = iov_to_buf(pkt->raw, pkt->raw_frags, 210e263cd49SDmitry Fleytman l2_hdr->iov_len + sizeof(struct ip_header), 211e263cd49SDmitry Fleytman l3_hdr->iov_base + sizeof(struct ip_header), 212e263cd49SDmitry Fleytman l3_hdr->iov_len - sizeof(struct ip_header)); 213e263cd49SDmitry Fleytman if (bytes_read < l3_hdr->iov_len - sizeof(struct ip_header)) { 214e263cd49SDmitry Fleytman l3_hdr->iov_len = 0; 215e263cd49SDmitry Fleytman return false; 216e263cd49SDmitry Fleytman } 217eb700029SDmitry Fleytman } 218eb700029SDmitry Fleytman 219e263cd49SDmitry Fleytman break; 220e263cd49SDmitry Fleytman 221e263cd49SDmitry Fleytman case ETH_P_IPV6: 222eb700029SDmitry Fleytman { 223eb700029SDmitry Fleytman eth_ip6_hdr_info hdrinfo; 224eb700029SDmitry Fleytman 225e263cd49SDmitry Fleytman if (!eth_parse_ipv6_hdr(pkt->raw, pkt->raw_frags, l2_hdr->iov_len, 226eb700029SDmitry Fleytman &hdrinfo)) { 227e263cd49SDmitry Fleytman l3_hdr->iov_len = 0; 228e263cd49SDmitry Fleytman return false; 229e263cd49SDmitry Fleytman } 230e263cd49SDmitry Fleytman 231eb700029SDmitry Fleytman pkt->l4proto = hdrinfo.l4proto; 232eb700029SDmitry Fleytman full_ip6hdr_len = hdrinfo.full_hdr_len; 233eb700029SDmitry Fleytman 234eb700029SDmitry Fleytman if (full_ip6hdr_len > ETH_MAX_IP_DGRAM_LEN) { 235eb700029SDmitry Fleytman l3_hdr->iov_len = 0; 236eb700029SDmitry Fleytman return false; 237eb700029SDmitry Fleytman } 238e263cd49SDmitry Fleytman 239e263cd49SDmitry Fleytman bytes_read = iov_to_buf(pkt->raw, pkt->raw_frags, l2_hdr->iov_len, 240e263cd49SDmitry Fleytman l3_hdr->iov_base, full_ip6hdr_len); 241e263cd49SDmitry Fleytman 242e263cd49SDmitry Fleytman if (bytes_read < full_ip6hdr_len) { 243e263cd49SDmitry Fleytman l3_hdr->iov_len = 0; 244e263cd49SDmitry Fleytman return false; 245e263cd49SDmitry Fleytman } else { 246e263cd49SDmitry Fleytman l3_hdr->iov_len = full_ip6hdr_len; 247e263cd49SDmitry Fleytman } 248e263cd49SDmitry Fleytman break; 249eb700029SDmitry Fleytman } 250e263cd49SDmitry Fleytman default: 251e263cd49SDmitry Fleytman l3_hdr->iov_len = 0; 252e263cd49SDmitry Fleytman break; 253e263cd49SDmitry Fleytman } 254e263cd49SDmitry Fleytman 255605d52e6SDmitry Fleytman net_tx_pkt_calculate_hdr_len(pkt); 256e263cd49SDmitry Fleytman return true; 257e263cd49SDmitry Fleytman } 258e263cd49SDmitry Fleytman 259eb700029SDmitry Fleytman static void net_tx_pkt_rebuild_payload(struct NetTxPkt *pkt) 260e263cd49SDmitry Fleytman { 261eb700029SDmitry Fleytman pkt->payload_len = iov_size(pkt->raw, pkt->raw_frags) - pkt->hdr_len; 262605d52e6SDmitry Fleytman pkt->payload_frags = iov_copy(&pkt->vec[NET_TX_PKT_PL_START_FRAG], 263e263cd49SDmitry Fleytman pkt->max_payload_frags, 264e263cd49SDmitry Fleytman pkt->raw, pkt->raw_frags, 265eb700029SDmitry Fleytman pkt->hdr_len, pkt->payload_len); 266e263cd49SDmitry Fleytman } 267e263cd49SDmitry Fleytman 268605d52e6SDmitry Fleytman bool net_tx_pkt_parse(struct NetTxPkt *pkt) 269e263cd49SDmitry Fleytman { 270eb700029SDmitry Fleytman if (net_tx_pkt_parse_headers(pkt)) { 271605d52e6SDmitry Fleytman net_tx_pkt_rebuild_payload(pkt); 272eb700029SDmitry Fleytman return true; 273eb700029SDmitry Fleytman } else { 274eb700029SDmitry Fleytman return false; 275eb700029SDmitry Fleytman } 276e263cd49SDmitry Fleytman } 277e263cd49SDmitry Fleytman 278605d52e6SDmitry Fleytman struct virtio_net_hdr *net_tx_pkt_get_vhdr(struct NetTxPkt *pkt) 279e263cd49SDmitry Fleytman { 280e263cd49SDmitry Fleytman assert(pkt); 281e263cd49SDmitry Fleytman return &pkt->virt_hdr; 282e263cd49SDmitry Fleytman } 283e263cd49SDmitry Fleytman 284605d52e6SDmitry Fleytman static uint8_t net_tx_pkt_get_gso_type(struct NetTxPkt *pkt, 285e263cd49SDmitry Fleytman bool tso_enable) 286e263cd49SDmitry Fleytman { 287e263cd49SDmitry Fleytman uint8_t rc = VIRTIO_NET_HDR_GSO_NONE; 288e263cd49SDmitry Fleytman uint16_t l3_proto; 289e263cd49SDmitry Fleytman 290eb700029SDmitry Fleytman l3_proto = eth_get_l3_proto(&pkt->vec[NET_TX_PKT_L2HDR_FRAG], 1, 291605d52e6SDmitry Fleytman pkt->vec[NET_TX_PKT_L2HDR_FRAG].iov_len); 292e263cd49SDmitry Fleytman 293e263cd49SDmitry Fleytman if (!tso_enable) { 294e263cd49SDmitry Fleytman goto func_exit; 295e263cd49SDmitry Fleytman } 296e263cd49SDmitry Fleytman 297605d52e6SDmitry Fleytman rc = eth_get_gso_type(l3_proto, pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_base, 298e263cd49SDmitry Fleytman pkt->l4proto); 299e263cd49SDmitry Fleytman 300e263cd49SDmitry Fleytman func_exit: 301e263cd49SDmitry Fleytman return rc; 302e263cd49SDmitry Fleytman } 303e263cd49SDmitry Fleytman 304f9a9eb16SAkihiko Odaki bool net_tx_pkt_build_vheader(struct NetTxPkt *pkt, bool tso_enable, 305e263cd49SDmitry Fleytman bool csum_enable, uint32_t gso_size) 306e263cd49SDmitry Fleytman { 307e263cd49SDmitry Fleytman struct tcp_hdr l4hdr; 308f9a9eb16SAkihiko Odaki size_t bytes_read; 309e263cd49SDmitry Fleytman assert(pkt); 310e263cd49SDmitry Fleytman 311e263cd49SDmitry Fleytman /* csum has to be enabled if tso is. */ 312e263cd49SDmitry Fleytman assert(csum_enable || !tso_enable); 313e263cd49SDmitry Fleytman 314605d52e6SDmitry Fleytman pkt->virt_hdr.gso_type = net_tx_pkt_get_gso_type(pkt, tso_enable); 315e263cd49SDmitry Fleytman 316e263cd49SDmitry Fleytman switch (pkt->virt_hdr.gso_type & ~VIRTIO_NET_HDR_GSO_ECN) { 317e263cd49SDmitry Fleytman case VIRTIO_NET_HDR_GSO_NONE: 318e263cd49SDmitry Fleytman pkt->virt_hdr.hdr_len = 0; 319e263cd49SDmitry Fleytman pkt->virt_hdr.gso_size = 0; 320e263cd49SDmitry Fleytman break; 321e263cd49SDmitry Fleytman 322e263cd49SDmitry Fleytman case VIRTIO_NET_HDR_GSO_UDP: 323eb700029SDmitry Fleytman pkt->virt_hdr.gso_size = gso_size; 324e263cd49SDmitry Fleytman pkt->virt_hdr.hdr_len = pkt->hdr_len + sizeof(struct udp_header); 325e263cd49SDmitry Fleytman break; 326e263cd49SDmitry Fleytman 327e263cd49SDmitry Fleytman case VIRTIO_NET_HDR_GSO_TCPV4: 328e263cd49SDmitry Fleytman case VIRTIO_NET_HDR_GSO_TCPV6: 329f9a9eb16SAkihiko Odaki bytes_read = iov_to_buf(&pkt->vec[NET_TX_PKT_PL_START_FRAG], 330f9a9eb16SAkihiko Odaki pkt->payload_frags, 0, &l4hdr, sizeof(l4hdr)); 33102ef5fdcSAkihiko Odaki if (bytes_read < sizeof(l4hdr) || 33202ef5fdcSAkihiko Odaki l4hdr.th_off * sizeof(uint32_t) < sizeof(l4hdr)) { 333f9a9eb16SAkihiko Odaki return false; 334f9a9eb16SAkihiko Odaki } 335f9a9eb16SAkihiko Odaki 336e263cd49SDmitry Fleytman pkt->virt_hdr.hdr_len = pkt->hdr_len + l4hdr.th_off * sizeof(uint32_t); 337eb700029SDmitry Fleytman pkt->virt_hdr.gso_size = gso_size; 338e263cd49SDmitry Fleytman break; 339e263cd49SDmitry Fleytman 340e263cd49SDmitry Fleytman default: 341dfc6f865SStefan Weil g_assert_not_reached(); 342e263cd49SDmitry Fleytman } 343e263cd49SDmitry Fleytman 344e263cd49SDmitry Fleytman if (csum_enable) { 345e263cd49SDmitry Fleytman switch (pkt->l4proto) { 346e263cd49SDmitry Fleytman case IP_PROTO_TCP: 347dd32b5eaSAkihiko Odaki if (pkt->payload_len < sizeof(struct tcp_hdr)) { 348dd32b5eaSAkihiko Odaki return false; 349dd32b5eaSAkihiko Odaki } 350e263cd49SDmitry Fleytman pkt->virt_hdr.flags = VIRTIO_NET_HDR_F_NEEDS_CSUM; 351e263cd49SDmitry Fleytman pkt->virt_hdr.csum_start = pkt->hdr_len; 352e263cd49SDmitry Fleytman pkt->virt_hdr.csum_offset = offsetof(struct tcp_hdr, th_sum); 353e263cd49SDmitry Fleytman break; 354e263cd49SDmitry Fleytman case IP_PROTO_UDP: 355dd32b5eaSAkihiko Odaki if (pkt->payload_len < sizeof(struct udp_hdr)) { 356dd32b5eaSAkihiko Odaki return false; 357dd32b5eaSAkihiko Odaki } 358e263cd49SDmitry Fleytman pkt->virt_hdr.flags = VIRTIO_NET_HDR_F_NEEDS_CSUM; 359e263cd49SDmitry Fleytman pkt->virt_hdr.csum_start = pkt->hdr_len; 360e263cd49SDmitry Fleytman pkt->virt_hdr.csum_offset = offsetof(struct udp_hdr, uh_sum); 361e263cd49SDmitry Fleytman break; 362e263cd49SDmitry Fleytman default: 363e263cd49SDmitry Fleytman break; 364e263cd49SDmitry Fleytman } 365e263cd49SDmitry Fleytman } 366f9a9eb16SAkihiko Odaki 367f9a9eb16SAkihiko Odaki return true; 368e263cd49SDmitry Fleytman } 369e263cd49SDmitry Fleytman 370eb700029SDmitry Fleytman void net_tx_pkt_setup_vlan_header_ex(struct NetTxPkt *pkt, 371eb700029SDmitry Fleytman uint16_t vlan, uint16_t vlan_ethtype) 372e263cd49SDmitry Fleytman { 373e263cd49SDmitry Fleytman bool is_new; 374e263cd49SDmitry Fleytman assert(pkt); 375e263cd49SDmitry Fleytman 376eb700029SDmitry Fleytman eth_setup_vlan_headers_ex(pkt->vec[NET_TX_PKT_L2HDR_FRAG].iov_base, 377eb700029SDmitry Fleytman vlan, vlan_ethtype, &is_new); 378e263cd49SDmitry Fleytman 379e263cd49SDmitry Fleytman /* update l2hdrlen */ 380e263cd49SDmitry Fleytman if (is_new) { 381e263cd49SDmitry Fleytman pkt->hdr_len += sizeof(struct vlan_header); 382605d52e6SDmitry Fleytman pkt->vec[NET_TX_PKT_L2HDR_FRAG].iov_len += 383e263cd49SDmitry Fleytman sizeof(struct vlan_header); 384e263cd49SDmitry Fleytman } 385e263cd49SDmitry Fleytman } 386e263cd49SDmitry Fleytman 387*163246e1SAkihiko Odaki static bool net_tx_pkt_add_raw_fragment_common(struct NetTxPkt *pkt, 388*163246e1SAkihiko Odaki void *base, size_t len) 389e263cd49SDmitry Fleytman { 390e263cd49SDmitry Fleytman struct iovec *ventry; 391e263cd49SDmitry Fleytman assert(pkt); 392035e69b0SMauro Matteo Cascella 393035e69b0SMauro Matteo Cascella if (pkt->raw_frags >= pkt->max_raw_frags) { 394035e69b0SMauro Matteo Cascella return false; 395035e69b0SMauro Matteo Cascella } 396e263cd49SDmitry Fleytman 397e263cd49SDmitry Fleytman ventry = &pkt->raw[pkt->raw_frags]; 398*163246e1SAkihiko Odaki ventry->iov_base = base; 399*163246e1SAkihiko Odaki ventry->iov_len = len; 400eb700029SDmitry Fleytman pkt->raw_frags++; 401*163246e1SAkihiko Odaki 402eb700029SDmitry Fleytman return true; 403eb700029SDmitry Fleytman } 404e263cd49SDmitry Fleytman 405eb700029SDmitry Fleytman bool net_tx_pkt_has_fragments(struct NetTxPkt *pkt) 406eb700029SDmitry Fleytman { 407eb700029SDmitry Fleytman return pkt->raw_frags > 0; 408e263cd49SDmitry Fleytman } 409e263cd49SDmitry Fleytman 410605d52e6SDmitry Fleytman eth_pkt_types_e net_tx_pkt_get_packet_type(struct NetTxPkt *pkt) 411e263cd49SDmitry Fleytman { 412e263cd49SDmitry Fleytman assert(pkt); 413e263cd49SDmitry Fleytman 414e263cd49SDmitry Fleytman return pkt->packet_type; 415e263cd49SDmitry Fleytman } 416e263cd49SDmitry Fleytman 417605d52e6SDmitry Fleytman size_t net_tx_pkt_get_total_len(struct NetTxPkt *pkt) 418e263cd49SDmitry Fleytman { 419e263cd49SDmitry Fleytman assert(pkt); 420e263cd49SDmitry Fleytman 421e263cd49SDmitry Fleytman return pkt->hdr_len + pkt->payload_len; 422e263cd49SDmitry Fleytman } 423e263cd49SDmitry Fleytman 424605d52e6SDmitry Fleytman void net_tx_pkt_dump(struct NetTxPkt *pkt) 425e263cd49SDmitry Fleytman { 426605d52e6SDmitry Fleytman #ifdef NET_TX_PKT_DEBUG 427e263cd49SDmitry Fleytman assert(pkt); 428e263cd49SDmitry Fleytman 429e263cd49SDmitry Fleytman printf("TX PKT: hdr_len: %d, pkt_type: 0x%X, l2hdr_len: %lu, " 430e263cd49SDmitry Fleytman "l3hdr_len: %lu, payload_len: %u\n", pkt->hdr_len, pkt->packet_type, 431605d52e6SDmitry Fleytman pkt->vec[NET_TX_PKT_L2HDR_FRAG].iov_len, 432605d52e6SDmitry Fleytman pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_len, pkt->payload_len); 433e263cd49SDmitry Fleytman #endif 434e263cd49SDmitry Fleytman } 435e263cd49SDmitry Fleytman 436f4fdaf00SAkihiko Odaki void net_tx_pkt_reset(struct NetTxPkt *pkt, PCIDevice *pci_dev) 437e263cd49SDmitry Fleytman { 438e263cd49SDmitry Fleytman int i; 439e263cd49SDmitry Fleytman 440e263cd49SDmitry Fleytman /* no assert, as reset can be called before tx_pkt_init */ 441e263cd49SDmitry Fleytman if (!pkt) { 442e263cd49SDmitry Fleytman return; 443e263cd49SDmitry Fleytman } 444e263cd49SDmitry Fleytman 445e263cd49SDmitry Fleytman memset(&pkt->virt_hdr, 0, sizeof(pkt->virt_hdr)); 446e263cd49SDmitry Fleytman 447e263cd49SDmitry Fleytman assert(pkt->vec); 448eb700029SDmitry Fleytman 449e263cd49SDmitry Fleytman pkt->payload_len = 0; 450e263cd49SDmitry Fleytman pkt->payload_frags = 0; 451e263cd49SDmitry Fleytman 452283f0a05SThomas Huth if (pkt->max_raw_frags > 0) { 453e263cd49SDmitry Fleytman assert(pkt->raw); 454e263cd49SDmitry Fleytman for (i = 0; i < pkt->raw_frags; i++) { 455e263cd49SDmitry Fleytman assert(pkt->raw[i].iov_base); 456*163246e1SAkihiko Odaki net_tx_pkt_unmap_frag_pci(pkt->pci_dev, 457*163246e1SAkihiko Odaki pkt->raw[i].iov_base, 458*163246e1SAkihiko Odaki pkt->raw[i].iov_len); 459283f0a05SThomas Huth } 460e263cd49SDmitry Fleytman } 461f4fdaf00SAkihiko Odaki pkt->pci_dev = pci_dev; 462e263cd49SDmitry Fleytman pkt->raw_frags = 0; 463e263cd49SDmitry Fleytman 464e263cd49SDmitry Fleytman pkt->hdr_len = 0; 465e263cd49SDmitry Fleytman pkt->l4proto = 0; 466e263cd49SDmitry Fleytman } 467e263cd49SDmitry Fleytman 468*163246e1SAkihiko Odaki void net_tx_pkt_unmap_frag_pci(void *context, void *base, size_t len) 469*163246e1SAkihiko Odaki { 470*163246e1SAkihiko Odaki pci_dma_unmap(context, base, len, DMA_DIRECTION_TO_DEVICE, 0); 471*163246e1SAkihiko Odaki } 472*163246e1SAkihiko Odaki 473*163246e1SAkihiko Odaki bool net_tx_pkt_add_raw_fragment(struct NetTxPkt *pkt, hwaddr pa, 474*163246e1SAkihiko Odaki size_t len) 475*163246e1SAkihiko Odaki { 476*163246e1SAkihiko Odaki dma_addr_t mapped_len = len; 477*163246e1SAkihiko Odaki void *base = pci_dma_map(pkt->pci_dev, pa, &mapped_len, 478*163246e1SAkihiko Odaki DMA_DIRECTION_TO_DEVICE); 479*163246e1SAkihiko Odaki if (!base) { 480*163246e1SAkihiko Odaki return false; 481*163246e1SAkihiko Odaki } 482*163246e1SAkihiko Odaki 483*163246e1SAkihiko Odaki if (mapped_len != len || 484*163246e1SAkihiko Odaki !net_tx_pkt_add_raw_fragment_common(pkt, base, len)) { 485*163246e1SAkihiko Odaki net_tx_pkt_unmap_frag_pci(pkt->pci_dev, base, mapped_len); 486*163246e1SAkihiko Odaki return false; 487*163246e1SAkihiko Odaki } 488*163246e1SAkihiko Odaki 489*163246e1SAkihiko Odaki return true; 490*163246e1SAkihiko Odaki } 491*163246e1SAkihiko Odaki 49202ef5fdcSAkihiko Odaki static void net_tx_pkt_do_sw_csum(struct NetTxPkt *pkt, 49302ef5fdcSAkihiko Odaki struct iovec *iov, uint32_t iov_len, 49402ef5fdcSAkihiko Odaki uint16_t csl) 495e263cd49SDmitry Fleytman { 496e263cd49SDmitry Fleytman uint32_t csum_cntr; 497e263cd49SDmitry Fleytman uint16_t csum = 0; 498eb700029SDmitry Fleytman uint32_t cso; 499e263cd49SDmitry Fleytman /* num of iovec without vhdr */ 500e263cd49SDmitry Fleytman size_t csum_offset = pkt->virt_hdr.csum_start + pkt->virt_hdr.csum_offset; 5019a8d9492SAndrew uint16_t l3_proto = eth_get_l3_proto(iov, 1, iov->iov_len); 502e263cd49SDmitry Fleytman 503e263cd49SDmitry Fleytman /* Put zero to checksum field */ 504e263cd49SDmitry Fleytman iov_from_buf(iov, iov_len, csum_offset, &csum, sizeof csum); 505e263cd49SDmitry Fleytman 506e263cd49SDmitry Fleytman /* Calculate L4 TCP/UDP checksum */ 5079a8d9492SAndrew csum_cntr = 0; 5089a8d9492SAndrew cso = 0; 509e263cd49SDmitry Fleytman /* add pseudo header to csum */ 5109a8d9492SAndrew if (l3_proto == ETH_P_IP) { 5119a8d9492SAndrew csum_cntr = eth_calc_ip4_pseudo_hdr_csum( 5129a8d9492SAndrew pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_base, 5139a8d9492SAndrew csl, &cso); 5149a8d9492SAndrew } else if (l3_proto == ETH_P_IPV6) { 5159a8d9492SAndrew csum_cntr = eth_calc_ip6_pseudo_hdr_csum( 5169a8d9492SAndrew pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_base, 5179a8d9492SAndrew csl, pkt->l4proto, &cso); 5189a8d9492SAndrew } 519eb700029SDmitry Fleytman 520eb700029SDmitry Fleytman /* data checksum */ 521eb700029SDmitry Fleytman csum_cntr += 522eb700029SDmitry Fleytman net_checksum_add_iov(iov, iov_len, pkt->virt_hdr.csum_start, csl, cso); 523e263cd49SDmitry Fleytman 524e263cd49SDmitry Fleytman /* Put the checksum obtained into the packet */ 5250dacea92SEd Swierk csum = cpu_to_be16(net_checksum_finish_nozero(csum_cntr)); 526e263cd49SDmitry Fleytman iov_from_buf(iov, iov_len, csum_offset, &csum, sizeof csum); 527e263cd49SDmitry Fleytman } 528e263cd49SDmitry Fleytman 529605d52e6SDmitry Fleytman #define NET_MAX_FRAG_SG_LIST (64) 530e263cd49SDmitry Fleytman 531605d52e6SDmitry Fleytman static size_t net_tx_pkt_fetch_fragment(struct NetTxPkt *pkt, 53202ef5fdcSAkihiko Odaki int *src_idx, size_t *src_offset, size_t src_len, 53302ef5fdcSAkihiko Odaki struct iovec *dst, int *dst_idx) 534e263cd49SDmitry Fleytman { 535e263cd49SDmitry Fleytman size_t fetched = 0; 536e263cd49SDmitry Fleytman struct iovec *src = pkt->vec; 537e263cd49SDmitry Fleytman 53802ef5fdcSAkihiko Odaki while (fetched < src_len) { 539e263cd49SDmitry Fleytman 540e263cd49SDmitry Fleytman /* no more place in fragment iov */ 541605d52e6SDmitry Fleytman if (*dst_idx == NET_MAX_FRAG_SG_LIST) { 542e263cd49SDmitry Fleytman break; 543e263cd49SDmitry Fleytman } 544e263cd49SDmitry Fleytman 545e263cd49SDmitry Fleytman /* no more data in iovec */ 546605d52e6SDmitry Fleytman if (*src_idx == (pkt->payload_frags + NET_TX_PKT_PL_START_FRAG)) { 547e263cd49SDmitry Fleytman break; 548e263cd49SDmitry Fleytman } 549e263cd49SDmitry Fleytman 550e263cd49SDmitry Fleytman 551e263cd49SDmitry Fleytman dst[*dst_idx].iov_base = src[*src_idx].iov_base + *src_offset; 552e263cd49SDmitry Fleytman dst[*dst_idx].iov_len = MIN(src[*src_idx].iov_len - *src_offset, 55302ef5fdcSAkihiko Odaki src_len - fetched); 554e263cd49SDmitry Fleytman 555e263cd49SDmitry Fleytman *src_offset += dst[*dst_idx].iov_len; 556e263cd49SDmitry Fleytman fetched += dst[*dst_idx].iov_len; 557e263cd49SDmitry Fleytman 558e263cd49SDmitry Fleytman if (*src_offset == src[*src_idx].iov_len) { 559e263cd49SDmitry Fleytman *src_offset = 0; 560e263cd49SDmitry Fleytman (*src_idx)++; 561e263cd49SDmitry Fleytman } 562e263cd49SDmitry Fleytman 563e263cd49SDmitry Fleytman (*dst_idx)++; 564e263cd49SDmitry Fleytman } 565e263cd49SDmitry Fleytman 566e263cd49SDmitry Fleytman return fetched; 567e263cd49SDmitry Fleytman } 568e263cd49SDmitry Fleytman 569ffbd2dbdSAkihiko Odaki static void net_tx_pkt_sendv( 570ffbd2dbdSAkihiko Odaki void *opaque, const struct iovec *iov, int iov_cnt, 571ffbd2dbdSAkihiko Odaki const struct iovec *virt_iov, int virt_iov_cnt) 572eb700029SDmitry Fleytman { 573ffbd2dbdSAkihiko Odaki NetClientState *nc = opaque; 574ffbd2dbdSAkihiko Odaki 575ffbd2dbdSAkihiko Odaki if (qemu_get_using_vnet_hdr(nc->peer)) { 576ffbd2dbdSAkihiko Odaki qemu_sendv_packet(nc, virt_iov, virt_iov_cnt); 577eb700029SDmitry Fleytman } else { 578eb700029SDmitry Fleytman qemu_sendv_packet(nc, iov, iov_cnt); 579eb700029SDmitry Fleytman } 580eb700029SDmitry Fleytman } 581eb700029SDmitry Fleytman 58202ef5fdcSAkihiko Odaki static bool net_tx_pkt_tcp_fragment_init(struct NetTxPkt *pkt, 58302ef5fdcSAkihiko Odaki struct iovec *fragment, 58402ef5fdcSAkihiko Odaki int *pl_idx, 58502ef5fdcSAkihiko Odaki size_t *l4hdr_len, 58602ef5fdcSAkihiko Odaki int *src_idx, 58702ef5fdcSAkihiko Odaki size_t *src_offset, 58802ef5fdcSAkihiko Odaki size_t *src_len) 58902ef5fdcSAkihiko Odaki { 59002ef5fdcSAkihiko Odaki struct iovec *l4 = fragment + NET_TX_PKT_PL_START_FRAG; 59102ef5fdcSAkihiko Odaki size_t bytes_read = 0; 59202ef5fdcSAkihiko Odaki struct tcp_hdr *th; 59302ef5fdcSAkihiko Odaki 59402ef5fdcSAkihiko Odaki if (!pkt->payload_frags) { 59502ef5fdcSAkihiko Odaki return false; 59602ef5fdcSAkihiko Odaki } 59702ef5fdcSAkihiko Odaki 59802ef5fdcSAkihiko Odaki l4->iov_len = pkt->virt_hdr.hdr_len - pkt->hdr_len; 59902ef5fdcSAkihiko Odaki l4->iov_base = g_malloc(l4->iov_len); 60002ef5fdcSAkihiko Odaki 60102ef5fdcSAkihiko Odaki *src_idx = NET_TX_PKT_PL_START_FRAG; 60202ef5fdcSAkihiko Odaki while (pkt->vec[*src_idx].iov_len < l4->iov_len - bytes_read) { 60302ef5fdcSAkihiko Odaki memcpy((char *)l4->iov_base + bytes_read, pkt->vec[*src_idx].iov_base, 60402ef5fdcSAkihiko Odaki pkt->vec[*src_idx].iov_len); 60502ef5fdcSAkihiko Odaki 60602ef5fdcSAkihiko Odaki bytes_read += pkt->vec[*src_idx].iov_len; 60702ef5fdcSAkihiko Odaki 60802ef5fdcSAkihiko Odaki (*src_idx)++; 60902ef5fdcSAkihiko Odaki if (*src_idx >= pkt->payload_frags + NET_TX_PKT_PL_START_FRAG) { 61002ef5fdcSAkihiko Odaki g_free(l4->iov_base); 61102ef5fdcSAkihiko Odaki return false; 61202ef5fdcSAkihiko Odaki } 61302ef5fdcSAkihiko Odaki } 61402ef5fdcSAkihiko Odaki 61502ef5fdcSAkihiko Odaki *src_offset = l4->iov_len - bytes_read; 61602ef5fdcSAkihiko Odaki memcpy((char *)l4->iov_base + bytes_read, pkt->vec[*src_idx].iov_base, 61702ef5fdcSAkihiko Odaki *src_offset); 61802ef5fdcSAkihiko Odaki 61902ef5fdcSAkihiko Odaki th = l4->iov_base; 62002ef5fdcSAkihiko Odaki th->th_flags &= ~(TH_FIN | TH_PUSH); 62102ef5fdcSAkihiko Odaki 62202ef5fdcSAkihiko Odaki *pl_idx = NET_TX_PKT_PL_START_FRAG + 1; 62302ef5fdcSAkihiko Odaki *l4hdr_len = l4->iov_len; 62402ef5fdcSAkihiko Odaki *src_len = pkt->virt_hdr.gso_size; 62502ef5fdcSAkihiko Odaki 62602ef5fdcSAkihiko Odaki return true; 62702ef5fdcSAkihiko Odaki } 62802ef5fdcSAkihiko Odaki 62902ef5fdcSAkihiko Odaki static void net_tx_pkt_tcp_fragment_deinit(struct iovec *fragment) 63002ef5fdcSAkihiko Odaki { 63102ef5fdcSAkihiko Odaki g_free(fragment[NET_TX_PKT_PL_START_FRAG].iov_base); 63202ef5fdcSAkihiko Odaki } 63302ef5fdcSAkihiko Odaki 63402ef5fdcSAkihiko Odaki static void net_tx_pkt_tcp_fragment_fix(struct NetTxPkt *pkt, 63502ef5fdcSAkihiko Odaki struct iovec *fragment, 63602ef5fdcSAkihiko Odaki size_t fragment_len, 63702ef5fdcSAkihiko Odaki uint8_t gso_type) 63802ef5fdcSAkihiko Odaki { 63902ef5fdcSAkihiko Odaki struct iovec *l3hdr = fragment + NET_TX_PKT_L3HDR_FRAG; 64002ef5fdcSAkihiko Odaki struct iovec *l4hdr = fragment + NET_TX_PKT_PL_START_FRAG; 64102ef5fdcSAkihiko Odaki struct ip_header *ip = l3hdr->iov_base; 64202ef5fdcSAkihiko Odaki struct ip6_header *ip6 = l3hdr->iov_base; 64302ef5fdcSAkihiko Odaki size_t len = l3hdr->iov_len + l4hdr->iov_len + fragment_len; 64402ef5fdcSAkihiko Odaki 64502ef5fdcSAkihiko Odaki switch (gso_type) { 64602ef5fdcSAkihiko Odaki case VIRTIO_NET_HDR_GSO_TCPV4: 64702ef5fdcSAkihiko Odaki ip->ip_len = cpu_to_be16(len); 64802ef5fdcSAkihiko Odaki eth_fix_ip4_checksum(l3hdr->iov_base, l3hdr->iov_len); 64902ef5fdcSAkihiko Odaki break; 65002ef5fdcSAkihiko Odaki 65102ef5fdcSAkihiko Odaki case VIRTIO_NET_HDR_GSO_TCPV6: 65202ef5fdcSAkihiko Odaki len -= sizeof(struct ip6_header); 65302ef5fdcSAkihiko Odaki ip6->ip6_ctlun.ip6_un1.ip6_un1_plen = cpu_to_be16(len); 65402ef5fdcSAkihiko Odaki break; 65502ef5fdcSAkihiko Odaki } 65602ef5fdcSAkihiko Odaki } 65702ef5fdcSAkihiko Odaki 65802ef5fdcSAkihiko Odaki static void net_tx_pkt_tcp_fragment_advance(struct NetTxPkt *pkt, 65902ef5fdcSAkihiko Odaki struct iovec *fragment, 66002ef5fdcSAkihiko Odaki size_t fragment_len, 66102ef5fdcSAkihiko Odaki uint8_t gso_type) 66202ef5fdcSAkihiko Odaki { 66302ef5fdcSAkihiko Odaki struct iovec *l3hdr = fragment + NET_TX_PKT_L3HDR_FRAG; 66402ef5fdcSAkihiko Odaki struct iovec *l4hdr = fragment + NET_TX_PKT_PL_START_FRAG; 66502ef5fdcSAkihiko Odaki struct ip_header *ip = l3hdr->iov_base; 66602ef5fdcSAkihiko Odaki struct tcp_hdr *th = l4hdr->iov_base; 66702ef5fdcSAkihiko Odaki 66802ef5fdcSAkihiko Odaki if (gso_type == VIRTIO_NET_HDR_GSO_TCPV4) { 66902ef5fdcSAkihiko Odaki ip->ip_id = cpu_to_be16(be16_to_cpu(ip->ip_id) + 1); 67002ef5fdcSAkihiko Odaki } 67102ef5fdcSAkihiko Odaki 67202ef5fdcSAkihiko Odaki th->th_seq = cpu_to_be32(be32_to_cpu(th->th_seq) + fragment_len); 67302ef5fdcSAkihiko Odaki th->th_flags &= ~TH_CWR; 67402ef5fdcSAkihiko Odaki } 67502ef5fdcSAkihiko Odaki 67602ef5fdcSAkihiko Odaki static void net_tx_pkt_udp_fragment_init(struct NetTxPkt *pkt, 67702ef5fdcSAkihiko Odaki int *pl_idx, 67802ef5fdcSAkihiko Odaki size_t *l4hdr_len, 67902ef5fdcSAkihiko Odaki int *src_idx, size_t *src_offset, 68002ef5fdcSAkihiko Odaki size_t *src_len) 68102ef5fdcSAkihiko Odaki { 68202ef5fdcSAkihiko Odaki *pl_idx = NET_TX_PKT_PL_START_FRAG; 68302ef5fdcSAkihiko Odaki *l4hdr_len = 0; 68402ef5fdcSAkihiko Odaki *src_idx = NET_TX_PKT_PL_START_FRAG; 68502ef5fdcSAkihiko Odaki *src_offset = 0; 68602ef5fdcSAkihiko Odaki *src_len = IP_FRAG_ALIGN_SIZE(pkt->virt_hdr.gso_size); 68702ef5fdcSAkihiko Odaki } 68802ef5fdcSAkihiko Odaki 68902ef5fdcSAkihiko Odaki static void net_tx_pkt_udp_fragment_fix(struct NetTxPkt *pkt, 69002ef5fdcSAkihiko Odaki struct iovec *fragment, 69102ef5fdcSAkihiko Odaki size_t fragment_offset, 69202ef5fdcSAkihiko Odaki size_t fragment_len) 69302ef5fdcSAkihiko Odaki { 69402ef5fdcSAkihiko Odaki bool more_frags = fragment_offset + fragment_len < pkt->payload_len; 69502ef5fdcSAkihiko Odaki uint16_t orig_flags; 69602ef5fdcSAkihiko Odaki struct iovec *l3hdr = fragment + NET_TX_PKT_L3HDR_FRAG; 69702ef5fdcSAkihiko Odaki struct ip_header *ip = l3hdr->iov_base; 69802ef5fdcSAkihiko Odaki uint16_t frag_off_units = fragment_offset / IP_FRAG_UNIT_SIZE; 69902ef5fdcSAkihiko Odaki uint16_t new_ip_off; 70002ef5fdcSAkihiko Odaki 70102ef5fdcSAkihiko Odaki assert(fragment_offset % IP_FRAG_UNIT_SIZE == 0); 70202ef5fdcSAkihiko Odaki assert((frag_off_units & ~IP_OFFMASK) == 0); 70302ef5fdcSAkihiko Odaki 70402ef5fdcSAkihiko Odaki orig_flags = be16_to_cpu(ip->ip_off) & ~(IP_OFFMASK | IP_MF); 70502ef5fdcSAkihiko Odaki new_ip_off = frag_off_units | orig_flags | (more_frags ? IP_MF : 0); 70602ef5fdcSAkihiko Odaki ip->ip_off = cpu_to_be16(new_ip_off); 70702ef5fdcSAkihiko Odaki ip->ip_len = cpu_to_be16(l3hdr->iov_len + fragment_len); 70802ef5fdcSAkihiko Odaki 70902ef5fdcSAkihiko Odaki eth_fix_ip4_checksum(l3hdr->iov_base, l3hdr->iov_len); 71002ef5fdcSAkihiko Odaki } 71102ef5fdcSAkihiko Odaki 712605d52e6SDmitry Fleytman static bool net_tx_pkt_do_sw_fragmentation(struct NetTxPkt *pkt, 713ffbd2dbdSAkihiko Odaki NetTxPktCallback callback, 714ffbd2dbdSAkihiko Odaki void *context) 715e263cd49SDmitry Fleytman { 71602ef5fdcSAkihiko Odaki uint8_t gso_type = pkt->virt_hdr.gso_type & ~VIRTIO_NET_HDR_GSO_ECN; 717e263cd49SDmitry Fleytman 71802ef5fdcSAkihiko Odaki struct iovec fragment[NET_MAX_FRAG_SG_LIST]; 71902ef5fdcSAkihiko Odaki size_t fragment_len; 72002ef5fdcSAkihiko Odaki size_t l4hdr_len; 72102ef5fdcSAkihiko Odaki size_t src_len; 72202ef5fdcSAkihiko Odaki 72302ef5fdcSAkihiko Odaki int src_idx, dst_idx, pl_idx; 72402ef5fdcSAkihiko Odaki size_t src_offset; 725e263cd49SDmitry Fleytman size_t fragment_offset = 0; 726ffbd2dbdSAkihiko Odaki struct virtio_net_hdr virt_hdr = { 727ffbd2dbdSAkihiko Odaki .flags = pkt->virt_hdr.flags & VIRTIO_NET_HDR_F_NEEDS_CSUM ? 728ffbd2dbdSAkihiko Odaki VIRTIO_NET_HDR_F_DATA_VALID : 0 729ffbd2dbdSAkihiko Odaki }; 730e263cd49SDmitry Fleytman 731e263cd49SDmitry Fleytman /* Copy headers */ 732ffbd2dbdSAkihiko Odaki fragment[NET_TX_PKT_VHDR_FRAG].iov_base = &virt_hdr; 733ffbd2dbdSAkihiko Odaki fragment[NET_TX_PKT_VHDR_FRAG].iov_len = sizeof(virt_hdr); 73402ef5fdcSAkihiko Odaki fragment[NET_TX_PKT_L2HDR_FRAG] = pkt->vec[NET_TX_PKT_L2HDR_FRAG]; 73502ef5fdcSAkihiko Odaki fragment[NET_TX_PKT_L3HDR_FRAG] = pkt->vec[NET_TX_PKT_L3HDR_FRAG]; 736e263cd49SDmitry Fleytman 73702ef5fdcSAkihiko Odaki switch (gso_type) { 73802ef5fdcSAkihiko Odaki case VIRTIO_NET_HDR_GSO_TCPV4: 73902ef5fdcSAkihiko Odaki case VIRTIO_NET_HDR_GSO_TCPV6: 74002ef5fdcSAkihiko Odaki if (!net_tx_pkt_tcp_fragment_init(pkt, fragment, &pl_idx, &l4hdr_len, 74102ef5fdcSAkihiko Odaki &src_idx, &src_offset, &src_len)) { 74202ef5fdcSAkihiko Odaki return false; 74302ef5fdcSAkihiko Odaki } 74402ef5fdcSAkihiko Odaki break; 74502ef5fdcSAkihiko Odaki 74602ef5fdcSAkihiko Odaki case VIRTIO_NET_HDR_GSO_UDP: 74702ef5fdcSAkihiko Odaki net_tx_pkt_do_sw_csum(pkt, &pkt->vec[NET_TX_PKT_L2HDR_FRAG], 74802ef5fdcSAkihiko Odaki pkt->payload_frags + NET_TX_PKT_PL_START_FRAG - 1, 74902ef5fdcSAkihiko Odaki pkt->payload_len); 75002ef5fdcSAkihiko Odaki net_tx_pkt_udp_fragment_init(pkt, &pl_idx, &l4hdr_len, 75102ef5fdcSAkihiko Odaki &src_idx, &src_offset, &src_len); 75202ef5fdcSAkihiko Odaki break; 75302ef5fdcSAkihiko Odaki 75402ef5fdcSAkihiko Odaki default: 75502ef5fdcSAkihiko Odaki abort(); 75602ef5fdcSAkihiko Odaki } 757e263cd49SDmitry Fleytman 758e263cd49SDmitry Fleytman /* Put as much data as possible and send */ 75902ef5fdcSAkihiko Odaki while (true) { 76002ef5fdcSAkihiko Odaki dst_idx = pl_idx; 76102ef5fdcSAkihiko Odaki fragment_len = net_tx_pkt_fetch_fragment(pkt, 76202ef5fdcSAkihiko Odaki &src_idx, &src_offset, src_len, fragment, &dst_idx); 76302ef5fdcSAkihiko Odaki if (!fragment_len) { 76402ef5fdcSAkihiko Odaki break; 76502ef5fdcSAkihiko Odaki } 766e263cd49SDmitry Fleytman 76702ef5fdcSAkihiko Odaki switch (gso_type) { 76802ef5fdcSAkihiko Odaki case VIRTIO_NET_HDR_GSO_TCPV4: 76902ef5fdcSAkihiko Odaki case VIRTIO_NET_HDR_GSO_TCPV6: 77002ef5fdcSAkihiko Odaki net_tx_pkt_tcp_fragment_fix(pkt, fragment, fragment_len, gso_type); 77102ef5fdcSAkihiko Odaki net_tx_pkt_do_sw_csum(pkt, fragment + NET_TX_PKT_L2HDR_FRAG, 77202ef5fdcSAkihiko Odaki dst_idx - NET_TX_PKT_L2HDR_FRAG, 77302ef5fdcSAkihiko Odaki l4hdr_len + fragment_len); 77402ef5fdcSAkihiko Odaki break; 775e263cd49SDmitry Fleytman 77602ef5fdcSAkihiko Odaki case VIRTIO_NET_HDR_GSO_UDP: 77702ef5fdcSAkihiko Odaki net_tx_pkt_udp_fragment_fix(pkt, fragment, fragment_offset, 77802ef5fdcSAkihiko Odaki fragment_len); 77902ef5fdcSAkihiko Odaki break; 78002ef5fdcSAkihiko Odaki } 781e263cd49SDmitry Fleytman 782ffbd2dbdSAkihiko Odaki callback(context, 783ffbd2dbdSAkihiko Odaki fragment + NET_TX_PKT_L2HDR_FRAG, dst_idx - NET_TX_PKT_L2HDR_FRAG, 784ffbd2dbdSAkihiko Odaki fragment + NET_TX_PKT_VHDR_FRAG, dst_idx - NET_TX_PKT_VHDR_FRAG); 785e263cd49SDmitry Fleytman 78602ef5fdcSAkihiko Odaki if (gso_type == VIRTIO_NET_HDR_GSO_TCPV4 || 78702ef5fdcSAkihiko Odaki gso_type == VIRTIO_NET_HDR_GSO_TCPV6) { 78802ef5fdcSAkihiko Odaki net_tx_pkt_tcp_fragment_advance(pkt, fragment, fragment_len, 78902ef5fdcSAkihiko Odaki gso_type); 79002ef5fdcSAkihiko Odaki } 791e263cd49SDmitry Fleytman 79202ef5fdcSAkihiko Odaki fragment_offset += fragment_len; 79302ef5fdcSAkihiko Odaki } 79402ef5fdcSAkihiko Odaki 79502ef5fdcSAkihiko Odaki if (gso_type == VIRTIO_NET_HDR_GSO_TCPV4 || 79602ef5fdcSAkihiko Odaki gso_type == VIRTIO_NET_HDR_GSO_TCPV6) { 79702ef5fdcSAkihiko Odaki net_tx_pkt_tcp_fragment_deinit(fragment); 79802ef5fdcSAkihiko Odaki } 799e263cd49SDmitry Fleytman 800e263cd49SDmitry Fleytman return true; 801e263cd49SDmitry Fleytman } 802e263cd49SDmitry Fleytman 803605d52e6SDmitry Fleytman bool net_tx_pkt_send(struct NetTxPkt *pkt, NetClientState *nc) 804e263cd49SDmitry Fleytman { 805ffbd2dbdSAkihiko Odaki bool offload = qemu_get_using_vnet_hdr(nc->peer); 806ffbd2dbdSAkihiko Odaki return net_tx_pkt_send_custom(pkt, offload, net_tx_pkt_sendv, nc); 807ffbd2dbdSAkihiko Odaki } 80855daf493SAkihiko Odaki 809ffbd2dbdSAkihiko Odaki bool net_tx_pkt_send_custom(struct NetTxPkt *pkt, bool offload, 810ffbd2dbdSAkihiko Odaki NetTxPktCallback callback, void *context) 811ffbd2dbdSAkihiko Odaki { 812e263cd49SDmitry Fleytman assert(pkt); 813e263cd49SDmitry Fleytman 8144cf3a638SAkihiko Odaki uint8_t gso_type = pkt->virt_hdr.gso_type & ~VIRTIO_NET_HDR_GSO_ECN; 8154cf3a638SAkihiko Odaki 816e263cd49SDmitry Fleytman /* 817e263cd49SDmitry Fleytman * Since underlying infrastructure does not support IP datagrams longer 818e263cd49SDmitry Fleytman * than 64K we should drop such packets and don't even try to send 819e263cd49SDmitry Fleytman */ 8204cf3a638SAkihiko Odaki if (VIRTIO_NET_HDR_GSO_NONE != gso_type) { 821e263cd49SDmitry Fleytman if (pkt->payload_len > 822e263cd49SDmitry Fleytman ETH_MAX_IP_DGRAM_LEN - 823605d52e6SDmitry Fleytman pkt->vec[NET_TX_PKT_L3HDR_FRAG].iov_len) { 824e263cd49SDmitry Fleytman return false; 825e263cd49SDmitry Fleytman } 826e263cd49SDmitry Fleytman } 827e263cd49SDmitry Fleytman 8284cf3a638SAkihiko Odaki if (offload || gso_type == VIRTIO_NET_HDR_GSO_NONE) { 82902ef5fdcSAkihiko Odaki if (!offload && pkt->virt_hdr.flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) { 83002ef5fdcSAkihiko Odaki net_tx_pkt_do_sw_csum(pkt, &pkt->vec[NET_TX_PKT_L2HDR_FRAG], 83102ef5fdcSAkihiko Odaki pkt->payload_frags + NET_TX_PKT_PL_START_FRAG - 1, 83202ef5fdcSAkihiko Odaki pkt->payload_len); 83302ef5fdcSAkihiko Odaki } 83402ef5fdcSAkihiko Odaki 835e219d309SAndrew net_tx_pkt_fix_ip6_payload_len(pkt); 836ffbd2dbdSAkihiko Odaki callback(context, pkt->vec + NET_TX_PKT_L2HDR_FRAG, 837ffbd2dbdSAkihiko Odaki pkt->payload_frags + NET_TX_PKT_PL_START_FRAG - NET_TX_PKT_L2HDR_FRAG, 838ffbd2dbdSAkihiko Odaki pkt->vec + NET_TX_PKT_VHDR_FRAG, 839ffbd2dbdSAkihiko Odaki pkt->payload_frags + NET_TX_PKT_PL_START_FRAG - NET_TX_PKT_VHDR_FRAG); 840e263cd49SDmitry Fleytman return true; 841e263cd49SDmitry Fleytman } 842e263cd49SDmitry Fleytman 843ffbd2dbdSAkihiko Odaki return net_tx_pkt_do_sw_fragmentation(pkt, callback, context); 844eb700029SDmitry Fleytman } 845e219d309SAndrew 846e219d309SAndrew void net_tx_pkt_fix_ip6_payload_len(struct NetTxPkt *pkt) 847e219d309SAndrew { 848e219d309SAndrew struct iovec *l2 = &pkt->vec[NET_TX_PKT_L2HDR_FRAG]; 849e219d309SAndrew if (eth_get_l3_proto(l2, 1, l2->iov_len) == ETH_P_IPV6) { 850e219d309SAndrew /* 851e219d309SAndrew * TODO: if qemu would support >64K packets - add jumbo option check 852e219d309SAndrew * something like that: 853e219d309SAndrew * 'if (ip6->ip6_plen == 0 && !has_jumbo_option(ip6)) {' 854e219d309SAndrew */ 8552a5f744eSAkihiko Odaki if (pkt->l3_hdr.ip6.ip6_plen == 0) { 856e219d309SAndrew if (pkt->payload_len <= ETH_MAX_IP_DGRAM_LEN) { 8572a5f744eSAkihiko Odaki pkt->l3_hdr.ip6.ip6_plen = htons(pkt->payload_len); 858e219d309SAndrew } 859e219d309SAndrew /* 860e219d309SAndrew * TODO: if qemu would support >64K packets 861e219d309SAndrew * add jumbo option for packets greater then 65,535 bytes 862e219d309SAndrew */ 863e219d309SAndrew } 864e219d309SAndrew } 865e219d309SAndrew } 866