2 * QEMU RX packets abstractions
4 * Copyright (c) 2012 Ravello Systems LTD (http://ravellosystems.com)
6 * Developed by Daynix Computing LTD (http://www.daynix.com)
9 * Dmitry Fleytman <dmitry@daynix.com>
10 * Tamir Shomer <tamirs@daynix.com>
11 * Yan Vugenfirer <yan@daynix.com>
13 * This work is licensed under the terms of the GNU GPL, version 2 or later.
14 * See the COPYING file in the top-level directory.
18 #include "qemu/osdep.h"
20 #include "net_rx_pkt.h"
21 #include "net/checksum.h"
25 struct virtio_net_hdr virt_hdr
;
26 uint8_t ehdr_buf
[sizeof(struct eth_header
)];
28 uint16_t vec_len_total
;
34 eth_pkt_types_e packet_type
;
36 /* Analysis results */
46 eth_ip6_hdr_info ip6hdr_info
;
47 eth_ip4_hdr_info ip4hdr_info
;
48 eth_l4_hdr_info l4hdr_info
;
51 void net_rx_pkt_init(struct NetRxPkt
**pkt
, bool has_virt_hdr
)
53 struct NetRxPkt
*p
= g_malloc0(sizeof *p
);
54 p
->has_virt_hdr
= has_virt_hdr
;
60 void net_rx_pkt_uninit(struct NetRxPkt
*pkt
)
62 if (pkt
->vec_len_total
!= 0) {
69 struct virtio_net_hdr
*net_rx_pkt_get_vhdr(struct NetRxPkt
*pkt
)
72 return &pkt
->virt_hdr
;
76 net_rx_pkt_iovec_realloc(struct NetRxPkt
*pkt
,
79 if (pkt
->vec_len_total
< new_iov_len
) {
81 pkt
->vec
= g_malloc(sizeof(*pkt
->vec
) * new_iov_len
);
82 pkt
->vec_len_total
= new_iov_len
;
87 net_rx_pkt_pull_data(struct NetRxPkt
*pkt
,
88 const struct iovec
*iov
, int iovcnt
,
91 if (pkt
->vlan_stripped
) {
92 net_rx_pkt_iovec_realloc(pkt
, iovcnt
+ 1);
94 pkt
->vec
[0].iov_base
= pkt
->ehdr_buf
;
95 pkt
->vec
[0].iov_len
= sizeof(pkt
->ehdr_buf
);
98 iov_size(iov
, iovcnt
) - ploff
+ sizeof(struct eth_header
);
100 pkt
->vec_len
= iov_copy(pkt
->vec
+ 1, pkt
->vec_len_total
- 1,
101 iov
, iovcnt
, ploff
, pkt
->tot_len
);
103 net_rx_pkt_iovec_realloc(pkt
, iovcnt
);
105 pkt
->tot_len
= iov_size(iov
, iovcnt
) - ploff
;
106 pkt
->vec_len
= iov_copy(pkt
->vec
, pkt
->vec_len_total
,
107 iov
, iovcnt
, ploff
, pkt
->tot_len
);
110 eth_get_protocols(pkt
->vec
, pkt
->vec_len
, &pkt
->isip4
, &pkt
->isip6
,
111 &pkt
->isudp
, &pkt
->istcp
,
112 &pkt
->l3hdr_off
, &pkt
->l4hdr_off
, &pkt
->l5hdr_off
,
113 &pkt
->ip6hdr_info
, &pkt
->ip4hdr_info
, &pkt
->l4hdr_info
);
115 trace_net_rx_pkt_parsed(pkt
->isip4
, pkt
->isip6
, pkt
->isudp
, pkt
->istcp
,
116 pkt
->l3hdr_off
, pkt
->l4hdr_off
, pkt
->l5hdr_off
);
119 void net_rx_pkt_attach_iovec(struct NetRxPkt
*pkt
,
120 const struct iovec
*iov
, int iovcnt
,
121 size_t iovoff
, bool strip_vlan
)
124 uint16_t ploff
= iovoff
;
126 pkt
->vlan_stripped
= false;
129 pkt
->vlan_stripped
= eth_strip_vlan(iov
, iovcnt
, iovoff
, pkt
->ehdr_buf
,
135 net_rx_pkt_pull_data(pkt
, iov
, iovcnt
, ploff
);
138 void net_rx_pkt_attach_iovec_ex(struct NetRxPkt
*pkt
,
139 const struct iovec
*iov
, int iovcnt
,
140 size_t iovoff
, bool strip_vlan
,
144 uint16_t ploff
= iovoff
;
146 pkt
->vlan_stripped
= false;
149 pkt
->vlan_stripped
= eth_strip_vlan_ex(iov
, iovcnt
, iovoff
, vet
,
156 net_rx_pkt_pull_data(pkt
, iov
, iovcnt
, ploff
);
159 void net_rx_pkt_dump(struct NetRxPkt
*pkt
)
161 #ifdef NET_RX_PKT_DEBUG
162 NetRxPkt
*pkt
= (NetRxPkt
*)pkt
;
165 printf("RX PKT: tot_len: %d, vlan_stripped: %d, vlan_tag: %d\n",
166 pkt
->tot_len
, pkt
->vlan_stripped
, pkt
->tci
);
170 void net_rx_pkt_set_packet_type(struct NetRxPkt
*pkt
,
171 eth_pkt_types_e packet_type
)
175 pkt
->packet_type
= packet_type
;
179 eth_pkt_types_e
net_rx_pkt_get_packet_type(struct NetRxPkt
*pkt
)
183 return pkt
->packet_type
;
186 size_t net_rx_pkt_get_total_len(struct NetRxPkt
*pkt
)
193 void net_rx_pkt_set_protocols(struct NetRxPkt
*pkt
, const void *data
,
196 const struct iovec iov
= {
197 .iov_base
= (void *)data
,
203 eth_get_protocols(&iov
, 1, &pkt
->isip4
, &pkt
->isip6
,
204 &pkt
->isudp
, &pkt
->istcp
,
205 &pkt
->l3hdr_off
, &pkt
->l4hdr_off
, &pkt
->l5hdr_off
,
206 &pkt
->ip6hdr_info
, &pkt
->ip4hdr_info
, &pkt
->l4hdr_info
);
209 void net_rx_pkt_get_protocols(struct NetRxPkt
*pkt
,
210 bool *isip4
, bool *isip6
,
211 bool *isudp
, bool *istcp
)
221 size_t net_rx_pkt_get_l3_hdr_offset(struct NetRxPkt
*pkt
)
224 return pkt
->l3hdr_off
;
227 size_t net_rx_pkt_get_l4_hdr_offset(struct NetRxPkt
*pkt
)
230 return pkt
->l4hdr_off
;
233 size_t net_rx_pkt_get_l5_hdr_offset(struct NetRxPkt
*pkt
)
236 return pkt
->l5hdr_off
;
239 eth_ip6_hdr_info
*net_rx_pkt_get_ip6_info(struct NetRxPkt
*pkt
)
241 return &pkt
->ip6hdr_info
;
244 eth_ip4_hdr_info
*net_rx_pkt_get_ip4_info(struct NetRxPkt
*pkt
)
246 return &pkt
->ip4hdr_info
;
249 eth_l4_hdr_info
*net_rx_pkt_get_l4_info(struct NetRxPkt
*pkt
)
251 return &pkt
->l4hdr_info
;
255 _net_rx_rss_add_chunk(uint8_t *rss_input
, size_t *bytes_written
,
256 void *ptr
, size_t size
)
258 memcpy(&rss_input
[*bytes_written
], ptr
, size
);
259 trace_net_rx_pkt_rss_add_chunk(ptr
, size
, *bytes_written
);
260 *bytes_written
+= size
;
264 _net_rx_rss_prepare_ip4(uint8_t *rss_input
,
265 struct NetRxPkt
*pkt
,
266 size_t *bytes_written
)
268 struct ip_header
*ip4_hdr
= &pkt
->ip4hdr_info
.ip4_hdr
;
270 _net_rx_rss_add_chunk(rss_input
, bytes_written
,
271 &ip4_hdr
->ip_src
, sizeof(uint32_t));
273 _net_rx_rss_add_chunk(rss_input
, bytes_written
,
274 &ip4_hdr
->ip_dst
, sizeof(uint32_t));
278 _net_rx_rss_prepare_ip6(uint8_t *rss_input
,
279 struct NetRxPkt
*pkt
,
280 bool ipv6ex
, size_t *bytes_written
)
282 eth_ip6_hdr_info
*ip6info
= &pkt
->ip6hdr_info
;
284 _net_rx_rss_add_chunk(rss_input
, bytes_written
,
285 (ipv6ex
&& ip6info
->rss_ex_src_valid
) ? &ip6info
->rss_ex_src
286 : &ip6info
->ip6_hdr
.ip6_src
,
287 sizeof(struct in6_address
));
289 _net_rx_rss_add_chunk(rss_input
, bytes_written
,
290 (ipv6ex
&& ip6info
->rss_ex_dst_valid
) ? &ip6info
->rss_ex_dst
291 : &ip6info
->ip6_hdr
.ip6_dst
,
292 sizeof(struct in6_address
));
296 _net_rx_rss_prepare_tcp(uint8_t *rss_input
,
297 struct NetRxPkt
*pkt
,
298 size_t *bytes_written
)
300 struct tcp_header
*tcphdr
= &pkt
->l4hdr_info
.hdr
.tcp
;
302 _net_rx_rss_add_chunk(rss_input
, bytes_written
,
303 &tcphdr
->th_sport
, sizeof(uint16_t));
305 _net_rx_rss_add_chunk(rss_input
, bytes_written
,
306 &tcphdr
->th_dport
, sizeof(uint16_t));
310 net_rx_pkt_calc_rss_hash(struct NetRxPkt
*pkt
,
311 NetRxPktRssType type
,
314 uint8_t rss_input
[36];
315 size_t rss_length
= 0;
316 uint32_t rss_hash
= 0;
317 net_toeplitz_key key_data
;
322 trace_net_rx_pkt_rss_ip4();
323 _net_rx_rss_prepare_ip4(&rss_input
[0], pkt
, &rss_length
);
325 case NetPktRssIpV4Tcp
:
328 trace_net_rx_pkt_rss_ip4_tcp();
329 _net_rx_rss_prepare_ip4(&rss_input
[0], pkt
, &rss_length
);
330 _net_rx_rss_prepare_tcp(&rss_input
[0], pkt
, &rss_length
);
332 case NetPktRssIpV6Tcp
:
335 trace_net_rx_pkt_rss_ip6_tcp();
336 _net_rx_rss_prepare_ip6(&rss_input
[0], pkt
, true, &rss_length
);
337 _net_rx_rss_prepare_tcp(&rss_input
[0], pkt
, &rss_length
);
341 trace_net_rx_pkt_rss_ip6();
342 _net_rx_rss_prepare_ip6(&rss_input
[0], pkt
, false, &rss_length
);
344 case NetPktRssIpV6Ex
:
346 trace_net_rx_pkt_rss_ip6_ex();
347 _net_rx_rss_prepare_ip6(&rss_input
[0], pkt
, true, &rss_length
);
354 net_toeplitz_key_init(&key_data
, key
);
355 net_toeplitz_add(&rss_hash
, rss_input
, rss_length
, &key_data
);
357 trace_net_rx_pkt_rss_hash(rss_length
, rss_hash
);
362 uint16_t net_rx_pkt_get_ip_id(struct NetRxPkt
*pkt
)
367 return be16_to_cpu(pkt
->ip4hdr_info
.ip4_hdr
.ip_id
);
373 bool net_rx_pkt_is_tcp_ack(struct NetRxPkt
*pkt
)
378 return TCP_HEADER_FLAGS(&pkt
->l4hdr_info
.hdr
.tcp
) & TCP_FLAG_ACK
;
384 bool net_rx_pkt_has_tcp_data(struct NetRxPkt
*pkt
)
389 return pkt
->l4hdr_info
.has_tcp_data
;
395 struct iovec
*net_rx_pkt_get_iovec(struct NetRxPkt
*pkt
)
402 uint16_t net_rx_pkt_get_iovec_len(struct NetRxPkt
*pkt
)
409 void net_rx_pkt_set_vhdr(struct NetRxPkt
*pkt
,
410 struct virtio_net_hdr
*vhdr
)
414 memcpy(&pkt
->virt_hdr
, vhdr
, sizeof pkt
->virt_hdr
);
417 void net_rx_pkt_set_vhdr_iovec(struct NetRxPkt
*pkt
,
418 const struct iovec
*iov
, int iovcnt
)
422 iov_to_buf(iov
, iovcnt
, 0, &pkt
->virt_hdr
, sizeof pkt
->virt_hdr
);
425 bool net_rx_pkt_is_vlan_stripped(struct NetRxPkt
*pkt
)
429 return pkt
->vlan_stripped
;
432 bool net_rx_pkt_has_virt_hdr(struct NetRxPkt
*pkt
)
436 return pkt
->has_virt_hdr
;
439 uint16_t net_rx_pkt_get_vlan_tag(struct NetRxPkt
*pkt
)
446 bool net_rx_pkt_validate_l3_csum(struct NetRxPkt
*pkt
, bool *csum_valid
)
452 trace_net_rx_pkt_l3_csum_validate_entry();
455 trace_net_rx_pkt_l3_csum_validate_not_ip4();
459 csl
= pkt
->l4hdr_off
- pkt
->l3hdr_off
;
461 cntr
= net_checksum_add_iov(pkt
->vec
, pkt
->vec_len
,
465 csum
= net_checksum_finish(cntr
);
467 *csum_valid
= (csum
== 0);
469 trace_net_rx_pkt_l3_csum_validate_csum(pkt
->l3hdr_off
, csl
,
470 cntr
, csum
, *csum_valid
);
476 _net_rx_pkt_calc_l4_csum(struct NetRxPkt
*pkt
)
483 trace_net_rx_pkt_l4_csum_calc_entry();
487 csl
= be16_to_cpu(pkt
->l4hdr_info
.hdr
.udp
.uh_ulen
);
488 trace_net_rx_pkt_l4_csum_calc_ip4_udp();
490 csl
= be16_to_cpu(pkt
->ip4hdr_info
.ip4_hdr
.ip_len
) -
491 IP_HDR_GET_LEN(&pkt
->ip4hdr_info
.ip4_hdr
);
492 trace_net_rx_pkt_l4_csum_calc_ip4_tcp();
495 cntr
= eth_calc_ip4_pseudo_hdr_csum(&pkt
->ip4hdr_info
.ip4_hdr
,
497 trace_net_rx_pkt_l4_csum_calc_ph_csum(cntr
, csl
);
500 csl
= be16_to_cpu(pkt
->l4hdr_info
.hdr
.udp
.uh_ulen
);
501 trace_net_rx_pkt_l4_csum_calc_ip6_udp();
503 struct ip6_header
*ip6hdr
= &pkt
->ip6hdr_info
.ip6_hdr
;
504 size_t full_ip6hdr_len
= pkt
->l4hdr_off
- pkt
->l3hdr_off
;
505 size_t ip6opts_len
= full_ip6hdr_len
- sizeof(struct ip6_header
);
507 csl
= be16_to_cpu(ip6hdr
->ip6_ctlun
.ip6_un1
.ip6_un1_plen
) -
509 trace_net_rx_pkt_l4_csum_calc_ip6_tcp();
512 cntr
= eth_calc_ip6_pseudo_hdr_csum(&pkt
->ip6hdr_info
.ip6_hdr
, csl
,
513 pkt
->ip6hdr_info
.l4proto
, &cso
);
514 trace_net_rx_pkt_l4_csum_calc_ph_csum(cntr
, csl
);
517 cntr
+= net_checksum_add_iov(pkt
->vec
, pkt
->vec_len
,
518 pkt
->l4hdr_off
, csl
, cso
);
520 csum
= net_checksum_finish(cntr
);
522 trace_net_rx_pkt_l4_csum_calc_csum(pkt
->l4hdr_off
, csl
, cntr
, csum
);
527 bool net_rx_pkt_validate_l4_csum(struct NetRxPkt
*pkt
, bool *csum_valid
)
531 trace_net_rx_pkt_l4_csum_validate_entry();
533 if (!pkt
->istcp
&& !pkt
->isudp
) {
534 trace_net_rx_pkt_l4_csum_validate_not_xxp();
538 if (pkt
->isudp
&& (pkt
->l4hdr_info
.hdr
.udp
.uh_sum
== 0)) {
539 trace_net_rx_pkt_l4_csum_validate_udp_with_no_checksum();
543 if (pkt
->isip4
&& pkt
->ip4hdr_info
.fragment
) {
544 trace_net_rx_pkt_l4_csum_validate_ip4_fragment();
548 csum
= _net_rx_pkt_calc_l4_csum(pkt
);
550 *csum_valid
= ((csum
== 0) || (csum
== 0xFFFF));
552 trace_net_rx_pkt_l4_csum_validate_csum(*csum_valid
);
557 bool net_rx_pkt_fix_l4_csum(struct NetRxPkt
*pkt
)
562 trace_net_rx_pkt_l4_csum_fix_entry();
565 l4_cso
= offsetof(struct tcp_header
, th_sum
);
566 trace_net_rx_pkt_l4_csum_fix_tcp(l4_cso
);
567 } else if (pkt
->isudp
) {
568 if (pkt
->l4hdr_info
.hdr
.udp
.uh_sum
== 0) {
569 trace_net_rx_pkt_l4_csum_fix_udp_with_no_checksum();
572 l4_cso
= offsetof(struct udp_header
, uh_sum
);
573 trace_net_rx_pkt_l4_csum_fix_udp(l4_cso
);
575 trace_net_rx_pkt_l4_csum_fix_not_xxp();
579 if (pkt
->isip4
&& pkt
->ip4hdr_info
.fragment
) {
580 trace_net_rx_pkt_l4_csum_fix_ip4_fragment();
584 /* Set zero to checksum word */
585 iov_from_buf(pkt
->vec
, pkt
->vec_len
,
586 pkt
->l4hdr_off
+ l4_cso
,
587 &csum
, sizeof(csum
));
589 /* Calculate L4 checksum */
590 csum
= cpu_to_be16(_net_rx_pkt_calc_l4_csum(pkt
));
592 /* Set calculated checksum to checksum word */
593 iov_from_buf(pkt
->vec
, pkt
->vec_len
,
594 pkt
->l4hdr_off
+ l4_cso
,
595 &csum
, sizeof(csum
));
597 trace_net_rx_pkt_l4_csum_fix_csum(pkt
->l4hdr_off
+ l4_cso
, csum
);