2 * QEMU RX packets abstractions
4 * Copyright (c) 2012 Ravello Systems LTD (http://ravellosystems.com)
6 * Developed by Daynix Computing LTD (http://www.daynix.com)
13 * This work is licensed under the terms of the GNU GPL, version 2 or later.
14 * See the COPYING file in the top-level directory.
18 #include "qemu/osdep.h"
20 #include "net_rx_pkt.h"
21 #include "net/checksum.h"
/*
 * Fields of the RX packet descriptor. The enclosing struct declaration and
 * several members are outside this view.
 */
/* virtio-net header; exposed by net_rx_pkt_get_vhdr(), filled by the set_vhdr helpers. */
25 struct virtio_net_hdr virt_hdr;
/* Scratch buffer sized for one Ethernet header plus one VLAN header. */
26 uint8_t ehdr_buf[sizeof(struct eth_header) + sizeof(struct vlan_header)];
/* Number of entries allocated for pkt->vec (see net_rx_pkt_iovec_realloc()). */
28 uint16_t vec_len_total;
/* Packet type stored/returned by the set/get_packet_type accessors. */
34 eth_pkt_types_e packet_type;
36 /* Analysis results */
/* Header details filled in by eth_get_protocols(). */
46 eth_ip6_hdr_info ip6hdr_info;
47 eth_ip4_hdr_info ip4hdr_info;
48 eth_l4_hdr_info l4hdr_info;
/*
 * Create a new RX packet descriptor.
 *
 * The descriptor is allocated zero-filled with g_malloc0() and remembers
 * whether the packet carries a virtio header.
 * NOTE(review): the statement handing the new object back through *pkt is
 * not visible in this view.
 */
51 void net_rx_pkt_init(struct NetRxPkt **pkt, bool has_virt_hdr)
53 struct NetRxPkt *p = g_malloc0(sizeof *p);
54 p->has_virt_hdr = has_virt_hdr;
/*
 * Tear down an RX packet descriptor.
 *
 * The visible code only acts when vec_len_total is non-zero, i.e. when an
 * iovec array has been allocated; presumably that array is released here
 * (the body of the branch is not visible - TODO confirm).
 */
60 void net_rx_pkt_uninit(struct NetRxPkt *pkt)
62 if (pkt->vec_len_total != 0) {
/*
 * Return a pointer to the virtio header stored inside the packet
 * descriptor. The pointer refers to memory owned by pkt.
 */
69 struct virtio_net_hdr *net_rx_pkt_get_vhdr(struct NetRxPkt *pkt)
72 return &pkt->virt_hdr;
/*
 * Make sure pkt->vec has room for at least new_iov_len entries.
 *
 * The array is only replaced when the current capacity (vec_len_total) is
 * smaller than requested; the new array comes from g_malloc() and the
 * visible code does not copy the previous entries into it.
 */
76 net_rx_pkt_iovec_realloc(struct NetRxPkt *pkt,
79 if (pkt->vec_len_total < new_iov_len) {
81 pkt->vec = g_malloc(sizeof(*pkt->vec) * new_iov_len);
82 pkt->vec_len_total = new_iov_len;
/*
 * Build the packet's iovec (pkt->vec) from the caller's iov, starting at
 * payload offset ploff, then parse the protocol headers.
 *
 * When ehdr_buf_len is non-zero, entry 0 of pkt->vec points at ehdr_buf and
 * the payload follows from entry 1; otherwise the payload starts at entry 0.
 * tot_len and vec_len are updated accordingly.
 */
87 net_rx_pkt_pull_data(struct NetRxPkt *pkt,
88 const struct iovec *iov, int iovcnt,
/*
 * Payload length = total iov size minus the offset.
 * NOTE(review): assumes ploff <= iov_size(iov, iovcnt); otherwise the
 * unsigned subtraction wraps - confirm against callers.
 */
91 uint32_t pllen = iov_size(iov, iovcnt) - ploff;
93 if (pkt->ehdr_buf_len) {
/* One extra slot for the separately buffered Ethernet header. */
94 net_rx_pkt_iovec_realloc(pkt, iovcnt + 1);
96 pkt->vec[0].iov_base = pkt->ehdr_buf;
97 pkt->vec[0].iov_len = pkt->ehdr_buf_len;
99 pkt->tot_len = pllen + pkt->ehdr_buf_len;
/* The "+ 1" accounts for the header entry placed at vec[0]. */
100 pkt->vec_len = iov_copy(pkt->vec + 1, pkt->vec_len_total - 1,
101 iov, iovcnt, ploff, pllen) + 1;
103 net_rx_pkt_iovec_realloc(pkt, iovcnt);
105 pkt->tot_len = pllen;
106 pkt->vec_len = iov_copy(pkt->vec, pkt->vec_len_total,
107 iov, iovcnt, ploff, pkt->tot_len);
/* Parse L3/L4 headers; results land in the pkt analysis fields. */
110 eth_get_protocols(pkt->vec, pkt->vec_len, &pkt->isip4, &pkt->isip6,
111 &pkt->isudp, &pkt->istcp,
112 &pkt->l3hdr_off, &pkt->l4hdr_off, &pkt->l5hdr_off,
113 &pkt->ip6hdr_info, &pkt->ip4hdr_info, &pkt->l4hdr_info);
115 trace_net_rx_pkt_parsed(pkt->isip4, pkt->isip6, pkt->isudp, pkt->istcp,
116 pkt->l3hdr_off, pkt->l4hdr_off, pkt->l5hdr_off);
/*
 * Attach packet data found in iov (starting at byte offset iovoff) to pkt.
 *
 * One visible path calls eth_strip_vlan() and stores its result in
 * ehdr_buf_len; another sets ehdr_buf_len to 0. Presumably strip_vlan
 * selects between them (the condition is not visible - TODO confirm).
 * The data is then pulled in with net_rx_pkt_pull_data().
 */
119 void net_rx_pkt_attach_iovec(struct NetRxPkt *pkt,
120 const struct iovec *iov, int iovcnt,
121 size_t iovoff, bool strip_vlan)
/* Payload offset starts at iovoff; note the size_t value is narrowed to uint16_t. */
124 uint16_t ploff = iovoff;
128 pkt->ehdr_buf_len = eth_strip_vlan(iov, iovcnt, iovoff, pkt->ehdr_buf,
131 pkt->ehdr_buf_len = 0;
136 net_rx_pkt_pull_data(pkt, iov, iovcnt, ploff);
/*
 * Variant of net_rx_pkt_attach_iovec() that uses eth_strip_vlan_ex() and
 * passes it vet (the parameter declaring vet is not visible in this view).
 *
 * As in the non-_ex variant, ehdr_buf_len is either the result of the
 * strip call or 0, and the data is then pulled in with
 * net_rx_pkt_pull_data().
 */
139 void net_rx_pkt_attach_iovec_ex(struct NetRxPkt *pkt,
140 const struct iovec *iov, int iovcnt,
141 size_t iovoff, bool strip_vlan,
/* Payload offset starts at iovoff; note the size_t value is narrowed to uint16_t. */
145 uint16_t ploff = iovoff;
149 pkt->ehdr_buf_len = eth_strip_vlan_ex(iov, iovcnt, iovoff, vet,
153 pkt->ehdr_buf_len = 0;
158 net_rx_pkt_pull_data(pkt, iov, iovcnt, ploff);
/*
 * Debug helper: print total length, buffered Ethernet header length and
 * VLAN tag of the packet. The printing code is only compiled when
 * NET_RX_PKT_DEBUG is defined.
 *
 * NOTE(review): the format uses %d for tot_len/tci and %lu for
 * ehdr_buf_len; verify these match the field types (e.g. %zu if
 * ehdr_buf_len is a size_t) - field declarations are not visible here.
 */
161 void net_rx_pkt_dump(struct NetRxPkt *pkt)
163 #ifdef NET_RX_PKT_DEBUG
166 printf("RX PKT: tot_len: %d, ehdr_buf_len: %lu, vlan_tag: %d\n",
167 pkt->tot_len, pkt->ehdr_buf_len, pkt->tci);
/* Store packet_type in the packet descriptor. */
171 void net_rx_pkt_set_packet_type(struct NetRxPkt *pkt,
172 eth_pkt_types_e packet_type)
176 pkt->packet_type = packet_type;
/* Return the packet type previously stored in the descriptor. */
180 eth_pkt_types_e net_rx_pkt_get_packet_type(struct NetRxPkt *pkt)
184 return pkt->packet_type;
/*
 * Return the packet's total length as a size_t.
 * NOTE(review): body not visible here; presumably returns pkt->tot_len as
 * set by net_rx_pkt_pull_data() - confirm.
 */
187 size_t net_rx_pkt_get_total_len(struct NetRxPkt *pkt)
/*
 * Run protocol analysis on a flat buffer instead of the attached iovec.
 *
 * The buffer is wrapped in a single-element iovec (the const qualifier is
 * cast away only to fit the iovec type) and handed to eth_get_protocols(),
 * which fills the same analysis fields that net_rx_pkt_pull_data() fills.
 */
194 void net_rx_pkt_set_protocols(struct NetRxPkt *pkt, const void *data,
197 const struct iovec iov = {
198 .iov_base = (void *)data,
204 eth_get_protocols(&iov, 1, &pkt->isip4, &pkt->isip6,
205 &pkt->isudp, &pkt->istcp,
206 &pkt->l3hdr_off, &pkt->l4hdr_off, &pkt->l5hdr_off,
207 &pkt->ip6hdr_info, &pkt->ip4hdr_info, &pkt->l4hdr_info);
/*
 * Report protocol flags through the four bool out-parameters.
 * NOTE(review): body not visible here; presumably copies pkt->isip4,
 * isip6, isudp and istcp - confirm.
 */
210 void net_rx_pkt_get_protocols(struct NetRxPkt *pkt,
211 bool *isip4, bool *isip6,
212 bool *isudp, bool *istcp)
/* Return the L3 header offset recorded by the protocol analysis. */
222 size_t net_rx_pkt_get_l3_hdr_offset(struct NetRxPkt *pkt)
225 return pkt->l3hdr_off;
/* Return the L4 header offset recorded by the protocol analysis. */
228 size_t net_rx_pkt_get_l4_hdr_offset(struct NetRxPkt *pkt)
231 return pkt->l4hdr_off;
/* Return the L5 header offset recorded by the protocol analysis. */
234 size_t net_rx_pkt_get_l5_hdr_offset(struct NetRxPkt *pkt)
237 return pkt->l5hdr_off;
/* Return a pointer to the IPv6 header info stored inside pkt. */
240 eth_ip6_hdr_info *net_rx_pkt_get_ip6_info(struct NetRxPkt *pkt)
242 return &pkt->ip6hdr_info;
/* Return a pointer to the IPv4 header info stored inside pkt. */
245 eth_ip4_hdr_info *net_rx_pkt_get_ip4_info(struct NetRxPkt *pkt)
247 return &pkt->ip4hdr_info;
/* Return a pointer to the L4 header info stored inside pkt. */
250 eth_l4_hdr_info *net_rx_pkt_get_l4_info(struct NetRxPkt *pkt)
252 return &pkt->l4hdr_info;
/*
 * Append size bytes from ptr to the RSS input buffer at offset
 * *bytes_written, then advance *bytes_written by size.
 *
 * No bounds check is performed here; the caller must guarantee that
 * rss_input has room for the chunk.
 */
256 _net_rx_rss_add_chunk(uint8_t *rss_input, size_t *bytes_written,
257 void *ptr, size_t size)
259 memcpy(&rss_input[*bytes_written], ptr, size);
/* Traced before the offset is advanced, so the logged offset is the chunk start. */
260 trace_net_rx_pkt_rss_add_chunk(ptr, size, *bytes_written);
261 *bytes_written += size;
/*
 * Append the IPv4 source address followed by the destination address
 * (sizeof(uint32_t) bytes each) from the parsed IPv4 header to the RSS
 * input buffer. The fields are copied as stored in the header, without
 * byte-order conversion.
 */
265 _net_rx_rss_prepare_ip4(uint8_t *rss_input,
266 struct NetRxPkt *pkt,
267 size_t *bytes_written)
269 struct ip_header *ip4_hdr = &pkt->ip4hdr_info.ip4_hdr;
271 _net_rx_rss_add_chunk(rss_input, bytes_written,
272 &ip4_hdr->ip_src, sizeof(uint32_t));
274 _net_rx_rss_add_chunk(rss_input, bytes_written,
275 &ip4_hdr->ip_dst, sizeof(uint32_t));
/*
 * Append the IPv6 source address followed by the destination address to
 * the RSS input buffer (sizeof(struct in6_address) bytes each).
 *
 * When ipv6ex is true and the matching rss_ex_*_valid flag is set, the
 * rss_ex_src / rss_ex_dst address from the parsed header info is used in
 * place of the address from the base IPv6 header. Source and destination
 * are selected independently.
 */
279 _net_rx_rss_prepare_ip6(uint8_t *rss_input,
280 struct NetRxPkt *pkt,
281 bool ipv6ex, size_t *bytes_written)
283 eth_ip6_hdr_info *ip6info = &pkt->ip6hdr_info;
285 _net_rx_rss_add_chunk(rss_input, bytes_written,
286 (ipv6ex && ip6info->rss_ex_src_valid) ? &ip6info->rss_ex_src
287 : &ip6info->ip6_hdr.ip6_src,
288 sizeof(struct in6_address));
290 _net_rx_rss_add_chunk(rss_input, bytes_written,
291 (ipv6ex && ip6info->rss_ex_dst_valid) ? &ip6info->rss_ex_dst
292 : &ip6info->ip6_hdr.ip6_dst,
293 sizeof(struct in6_address));
/*
 * Append the TCP source port followed by the destination port
 * (sizeof(uint16_t) bytes each) from the parsed L4 header to the RSS input
 * buffer. The fields are copied as stored in the header, without
 * byte-order conversion.
 */
297 _net_rx_rss_prepare_tcp(uint8_t *rss_input,
298 struct NetRxPkt *pkt,
299 size_t *bytes_written)
301 struct tcp_header *tcphdr = &pkt->l4hdr_info.hdr.tcp;
303 _net_rx_rss_add_chunk(rss_input, bytes_written,
304 &tcphdr->th_sport, sizeof(uint16_t));
306 _net_rx_rss_add_chunk(rss_input, bytes_written,
307 &tcphdr->th_dport, sizeof(uint16_t));
/*
 * Compute the Toeplitz RSS hash of the packet for the requested hash type.
 *
 * The hash input is assembled into rss_input from the parsed headers
 * according to type (addresses only, or addresses plus TCP ports; the
 * IPv6 "Ex" variants may use the rss_ex_* addresses), then hashed with
 * the supplied key.
 * NOTE(review): the key parameter declaration, some case labels and the
 * return statement are not visible in this view.
 */
311 net_rx_pkt_calc_rss_hash(struct NetRxPkt *pkt,
312 NetRxPktRssType type,
/*
 * Presumably sized for the largest input: two IPv6 addresses plus two
 * 16-bit ports - TODO confirm sizeof(struct in6_address) == 16.
 */
315 uint8_t rss_input[36];
316 size_t rss_length = 0;
317 uint32_t rss_hash = 0;
318 net_toeplitz_key key_data;
323 trace_net_rx_pkt_rss_ip4();
324 _net_rx_rss_prepare_ip4(&rss_input[0], pkt, &rss_length);
326 case NetPktRssIpV4Tcp:
329 trace_net_rx_pkt_rss_ip4_tcp();
330 _net_rx_rss_prepare_ip4(&rss_input[0], pkt, &rss_length);
331 _net_rx_rss_prepare_tcp(&rss_input[0], pkt, &rss_length);
333 case NetPktRssIpV6Tcp:
336 trace_net_rx_pkt_rss_ip6_tcp();
/* The TCP-over-IPv6 type passes ipv6ex = true, like the IpV6Ex type. */
337 _net_rx_rss_prepare_ip6(&rss_input[0], pkt, true, &rss_length);
338 _net_rx_rss_prepare_tcp(&rss_input[0], pkt, &rss_length);
342 trace_net_rx_pkt_rss_ip6();
343 _net_rx_rss_prepare_ip6(&rss_input[0], pkt, false, &rss_length);
345 case NetPktRssIpV6Ex:
347 trace_net_rx_pkt_rss_ip6_ex();
348 _net_rx_rss_prepare_ip6(&rss_input[0], pkt, true, &rss_length);
/* Hash the assembled input with the caller-provided key. */
355 net_toeplitz_key_init(&key_data, key);
356 net_toeplitz_add(&rss_hash, rss_input, rss_length, &key_data);
358 trace_net_rx_pkt_rss_hash(rss_length, rss_hash);
/*
 * Return the IPv4 identification field of the parsed header, converted
 * from big-endian to host byte order.
 * NOTE(review): any precondition checks (e.g. that the packet is IPv4) are
 * not visible in this view.
 */
363 uint16_t net_rx_pkt_get_ip_id(struct NetRxPkt *pkt)
368 return be16_to_cpu(pkt->ip4hdr_info.ip4_hdr.ip_id);
/*
 * Return true when the ACK flag is set in the parsed TCP header's flags.
 * NOTE(review): any precondition checks (e.g. that the packet is TCP) are
 * not visible in this view.
 */
374 bool net_rx_pkt_is_tcp_ack(struct NetRxPkt *pkt)
379 return TCP_HEADER_FLAGS(&pkt->l4hdr_info.hdr.tcp) & TCP_FLAG_ACK;
/*
 * Return the has_tcp_data flag recorded in the parsed L4 header info.
 * NOTE(review): any precondition checks (e.g. that the packet is TCP) are
 * not visible in this view.
 */
385 bool net_rx_pkt_has_tcp_data(struct NetRxPkt *pkt)
390 return pkt->l4hdr_info.has_tcp_data;
/*
 * Return the packet's iovec array.
 * NOTE(review): body not visible here; presumably returns pkt->vec -
 * confirm.
 */
396 struct iovec *net_rx_pkt_get_iovec(struct NetRxPkt *pkt)
/*
 * Return the number of entries in the packet's iovec array.
 * NOTE(review): body not visible here; presumably returns pkt->vec_len -
 * confirm.
 */
403 uint16_t net_rx_pkt_get_iovec_len(struct NetRxPkt *pkt)
/*
 * Copy the caller's virtio header into the packet descriptor.
 * Exactly sizeof(pkt->virt_hdr) bytes are read from vhdr.
 */
410 void net_rx_pkt_set_vhdr(struct NetRxPkt *pkt,
411 struct virtio_net_hdr *vhdr)
415 memcpy(&pkt->virt_hdr, vhdr, sizeof pkt->virt_hdr);
/*
 * Fill the packet's virtio header from the start (offset 0) of an iovec,
 * requesting sizeof(pkt->virt_hdr) bytes via iov_to_buf(). The return
 * value of iov_to_buf() is not checked by the visible code.
 */
418 void net_rx_pkt_set_vhdr_iovec(struct NetRxPkt *pkt,
419 const struct iovec *iov, int iovcnt)
423 iov_to_buf(iov, iovcnt, 0, &pkt->virt_hdr, sizeof pkt->virt_hdr);
/*
 * Return true when ehdr_buf_len is non-zero, i.e. when the attach path
 * stored a non-zero result from eth_strip_vlan() / eth_strip_vlan_ex().
 */
426 bool net_rx_pkt_is_vlan_stripped(struct NetRxPkt *pkt)
430 return pkt->ehdr_buf_len ? true : false;
/* Return the has_virt_hdr flag given to net_rx_pkt_init(). */
433 bool net_rx_pkt_has_virt_hdr(struct NetRxPkt *pkt)
437 return pkt->has_virt_hdr;
/*
 * Return the packet's VLAN tag.
 * NOTE(review): body not visible here; presumably returns pkt->tci -
 * confirm.
 */
440 uint16_t net_rx_pkt_get_vlan_tag(struct NetRxPkt *pkt)
/*
 * Validate the L3 (IPv4 header) checksum of the packet.
 *
 * The checksum is summed over the bytes between the L3 and L4 header
 * offsets; *csum_valid is set to true when the folded result is 0.
 * Non-IPv4 packets take an early path that is only traced here (its
 * condition and the function's return values are not visible in this view).
 */
447 bool net_rx_pkt_validate_l3_csum(struct NetRxPkt *pkt, bool *csum_valid)
453 trace_net_rx_pkt_l3_csum_validate_entry();
456 trace_net_rx_pkt_l3_csum_validate_not_ip4();
/* L3 header length = distance from the L3 header to the L4 header. */
460 csl = pkt->l4hdr_off - pkt->l3hdr_off;
462 cntr = net_checksum_add_iov(pkt->vec, pkt->vec_len,
466 csum = net_checksum_finish(cntr);
468 *csum_valid = (csum == 0);
470 trace_net_rx_pkt_l3_csum_validate_csum(pkt->l3hdr_off, csl,
471 cntr, csum, *csum_valid);
/*
 * Compute the L4 (TCP/UDP) checksum of the packet, including the IPv4 or
 * IPv6 pseudo-header.
 *
 * The L4 length (csl) is taken from the UDP length field for UDP, and
 * derived from the IP header's length fields for TCP. The branch
 * conditions selecting each case are not visible in this view.
 *
 * NOTE(review): csl comes from packet-supplied header fields; the
 * subtractions below assume the length fields are at least as large as
 * the header sizes being subtracted - confirm validation elsewhere.
 */
477 _net_rx_pkt_calc_l4_csum(struct NetRxPkt *pkt)
484 trace_net_rx_pkt_l4_csum_calc_entry();
488 csl = be16_to_cpu(pkt->l4hdr_info.hdr.udp.uh_ulen);
489 trace_net_rx_pkt_l4_csum_calc_ip4_udp();
/* IPv4 TCP: L4 length = IP total length minus IP header length. */
491 csl = be16_to_cpu(pkt->ip4hdr_info.ip4_hdr.ip_len) -
492 IP_HDR_GET_LEN(&pkt->ip4hdr_info.ip4_hdr);
493 trace_net_rx_pkt_l4_csum_calc_ip4_tcp();
496 cntr = eth_calc_ip4_pseudo_hdr_csum(&pkt->ip4hdr_info.ip4_hdr,
498 trace_net_rx_pkt_l4_csum_calc_ph_csum(cntr, csl);
501 csl = be16_to_cpu(pkt->l4hdr_info.hdr.udp.uh_ulen);
502 trace_net_rx_pkt_l4_csum_calc_ip6_udp();
/*
 * IPv6 TCP: everything between the fixed IPv6 header and the L4 header
 * is counted as options/extension headers (ip6opts_len).
 */
504 struct ip6_header *ip6hdr = &pkt->ip6hdr_info.ip6_hdr;
505 size_t full_ip6hdr_len = pkt->l4hdr_off - pkt->l3hdr_off;
506 size_t ip6opts_len = full_ip6hdr_len - sizeof(struct ip6_header);
508 csl = be16_to_cpu(ip6hdr->ip6_ctlun.ip6_un1.ip6_un1_plen) -
510 trace_net_rx_pkt_l4_csum_calc_ip6_tcp();
513 cntr = eth_calc_ip6_pseudo_hdr_csum(&pkt->ip6hdr_info.ip6_hdr, csl,
514 pkt->ip6hdr_info.l4proto, &cso);
515 trace_net_rx_pkt_l4_csum_calc_ph_csum(cntr, csl);
/* Add the L4 header and payload (csl bytes from l4hdr_off) to the pseudo-header sum. */
518 cntr += net_checksum_add_iov(pkt->vec, pkt->vec_len,
519 pkt->l4hdr_off, csl, cso);
521 csum = net_checksum_finish_nozero(cntr);
523 trace_net_rx_pkt_l4_csum_calc_csum(pkt->l4hdr_off, csl, cntr, csum);
/*
 * Validate the L4 (TCP/UDP) checksum of the packet.
 *
 * Three cases take an early path before any checksum is computed: packets
 * that are neither TCP nor UDP, UDP packets whose checksum field is 0, and
 * IPv4 fragments. Otherwise the checksum is recomputed over the packet and
 * *csum_valid is set to true when the result is 0 or 0xFFFF.
 * NOTE(review): the return statements are not visible in this view.
 */
528 bool net_rx_pkt_validate_l4_csum(struct NetRxPkt *pkt, bool *csum_valid)
532 trace_net_rx_pkt_l4_csum_validate_entry();
534 if (!pkt->istcp && !pkt->isudp) {
535 trace_net_rx_pkt_l4_csum_validate_not_xxp();
539 if (pkt->isudp && (pkt->l4hdr_info.hdr.udp.uh_sum == 0)) {
540 trace_net_rx_pkt_l4_csum_validate_udp_with_no_checksum();
544 if (pkt->isip4 && pkt->ip4hdr_info.fragment) {
545 trace_net_rx_pkt_l4_csum_validate_ip4_fragment();
549 csum = _net_rx_pkt_calc_l4_csum(pkt);
551 *csum_valid = ((csum == 0) || (csum == 0xFFFF));
553 trace_net_rx_pkt_l4_csum_validate_csum(*csum_valid);
/*
 * Recompute the L4 (TCP/UDP) checksum and write it into the packet data.
 *
 * The checksum field offset within the L4 header is chosen per protocol.
 * UDP packets whose checksum field is 0, non-TCP/UDP packets and IPv4
 * fragments take early paths that are only traced in the visible code.
 * Otherwise the checksum word is overwritten, the checksum is recomputed
 * over the packet, and the result is stored in big-endian order.
 * NOTE(review): the declaration/initial value of csum and the return
 * statements are not visible in this view.
 */
558 bool net_rx_pkt_fix_l4_csum(struct NetRxPkt *pkt)
563 trace_net_rx_pkt_l4_csum_fix_entry();
566 l4_cso = offsetof(struct tcp_header, th_sum);
567 trace_net_rx_pkt_l4_csum_fix_tcp(l4_cso);
568 } else if (pkt->isudp) {
569 if (pkt->l4hdr_info.hdr.udp.uh_sum == 0) {
570 trace_net_rx_pkt_l4_csum_fix_udp_with_no_checksum();
573 l4_cso = offsetof(struct udp_header, uh_sum);
574 trace_net_rx_pkt_l4_csum_fix_udp(l4_cso);
576 trace_net_rx_pkt_l4_csum_fix_not_xxp();
580 if (pkt->isip4 && pkt->ip4hdr_info.fragment) {
581 trace_net_rx_pkt_l4_csum_fix_ip4_fragment();
585 /* Set zero to checksum word */
586 iov_from_buf(pkt->vec, pkt->vec_len,
587 pkt->l4hdr_off + l4_cso,
588 &csum, sizeof(csum));
590 /* Calculate L4 checksum */
591 csum = cpu_to_be16(_net_rx_pkt_calc_l4_csum(pkt));
593 /* Set calculated checksum to checksum word */
594 iov_from_buf(pkt->vec, pkt->vec_len,
595 pkt->l4hdr_off + l4_cso,
596 &csum, sizeof(csum));
598 trace_net_rx_pkt_l4_csum_fix_csum(pkt->l4hdr_off + l4_cso, csum);