4 * Copyright (c) 2004-2008 Fabrice Bellard
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
24 #include "qemu/osdep.h"
25 #include "qemu-common.h"
26 #include "qemu/timer.h"
27 #include "qemu/error-report.h"
28 #include "chardev/char-fe.h"
29 #include "migration/register.h"
32 #include "qemu/cutils.h"
38 /* host loopback address */
39 struct in_addr loopback_addr
;
40 /* host loopback network mask */
41 unsigned long loopback_mask
;
43 /* emulated hosts use the MAC addr 52:55:IP:IP:IP:IP */
44 static const uint8_t special_ethaddr
[ETH_ALEN
] = {
45 0x52, 0x55, 0x00, 0x00, 0x00, 0x00
50 static QTAILQ_HEAD(, Slirp
) slirp_instances
=
51 QTAILQ_HEAD_INITIALIZER(slirp_instances
);
53 static struct in_addr dns_addr
;
55 static struct in6_addr dns6_addr
;
57 static u_int dns_addr_time
;
59 static u_int dns6_addr_time
;
62 #define TIMEOUT_FAST 2 /* milliseconds */
63 #define TIMEOUT_SLOW 499 /* milliseconds */
64 /* for the aging of certain requests like DNS */
65 #define TIMEOUT_DEFAULT 1000 /* milliseconds */
69 int get_dns_addr(struct in_addr
*pdns_addr
)
71 FIXED_INFO
*FixedInfo
=NULL
;
74 IP_ADDR_STRING
*pIPAddr
;
75 struct in_addr tmp_addr
;
77 if (dns_addr
.s_addr
!= 0 && (curtime
- dns_addr_time
) < TIMEOUT_DEFAULT
) {
78 *pdns_addr
= dns_addr
;
82 FixedInfo
= (FIXED_INFO
*)GlobalAlloc(GPTR
, sizeof(FIXED_INFO
));
83 BufLen
= sizeof(FIXED_INFO
);
85 if (ERROR_BUFFER_OVERFLOW
== GetNetworkParams(FixedInfo
, &BufLen
)) {
87 GlobalFree(FixedInfo
);
90 FixedInfo
= GlobalAlloc(GPTR
, BufLen
);
93 if ((ret
= GetNetworkParams(FixedInfo
, &BufLen
)) != ERROR_SUCCESS
) {
94 printf("GetNetworkParams failed. ret = %08x\n", (u_int
)ret
);
96 GlobalFree(FixedInfo
);
102 pIPAddr
= &(FixedInfo
->DnsServerList
);
103 inet_aton(pIPAddr
->IpAddress
.String
, &tmp_addr
);
104 *pdns_addr
= tmp_addr
;
106 dns_addr_time
= curtime
;
108 GlobalFree(FixedInfo
);
114 int get_dns6_addr(struct in6_addr
*pdns6_addr
, uint32_t *scope_id
)
119 static void winsock_cleanup(void)
126 static int get_dns_addr_cached(void *pdns_addr
, void *cached_addr
,
128 struct stat
*cached_stat
, u_int
*cached_time
)
130 struct stat old_stat
;
131 if (curtime
- *cached_time
< TIMEOUT_DEFAULT
) {
132 memcpy(pdns_addr
, cached_addr
, addrlen
);
135 old_stat
= *cached_stat
;
136 if (stat("/etc/resolv.conf", cached_stat
) != 0) {
139 if (cached_stat
->st_dev
== old_stat
.st_dev
140 && cached_stat
->st_ino
== old_stat
.st_ino
141 && cached_stat
->st_size
== old_stat
.st_size
142 && cached_stat
->st_mtime
== old_stat
.st_mtime
) {
143 memcpy(pdns_addr
, cached_addr
, addrlen
);
149 static int get_dns_addr_resolv_conf(int af
, void *pdns_addr
, void *cached_addr
,
150 socklen_t addrlen
, uint32_t *scope_id
,
157 void *tmp_addr
= alloca(addrlen
);
160 f
= fopen("/etc/resolv.conf", "r");
165 fprintf(stderr
, "IP address of your DNS(s): ");
167 while (fgets(buff
, 512, f
) != NULL
) {
168 if (sscanf(buff
, "nameserver%*[ \t]%256s", buff2
) == 1) {
169 char *c
= strchr(buff2
, '%');
171 if_index
= if_nametoindex(c
+ 1);
177 if (!inet_pton(af
, buff2
, tmp_addr
)) {
180 /* If it's the first one, set it to dns_addr */
182 memcpy(pdns_addr
, tmp_addr
, addrlen
);
183 memcpy(cached_addr
, tmp_addr
, addrlen
);
185 *scope_id
= if_index
;
187 *cached_time
= curtime
;
191 fprintf(stderr
, ", ");
195 fprintf(stderr
, "(more)");
201 char s
[INET6_ADDRSTRLEN
];
202 const char *res
= inet_ntop(af
, tmp_addr
, s
, sizeof(s
));
204 res
= "(string conversion error)";
206 fprintf(stderr
, "%s", res
);
217 int get_dns_addr(struct in_addr
*pdns_addr
)
219 static struct stat dns_addr_stat
;
221 if (dns_addr
.s_addr
!= 0) {
223 ret
= get_dns_addr_cached(pdns_addr
, &dns_addr
, sizeof(dns_addr
),
224 &dns_addr_stat
, &dns_addr_time
);
229 return get_dns_addr_resolv_conf(AF_INET
, pdns_addr
, &dns_addr
,
230 sizeof(dns_addr
), NULL
, &dns_addr_time
);
233 int get_dns6_addr(struct in6_addr
*pdns6_addr
, uint32_t *scope_id
)
235 static struct stat dns6_addr_stat
;
237 if (!in6_zero(&dns6_addr
)) {
239 ret
= get_dns_addr_cached(pdns6_addr
, &dns6_addr
, sizeof(dns6_addr
),
240 &dns6_addr_stat
, &dns6_addr_time
);
245 return get_dns_addr_resolv_conf(AF_INET6
, pdns6_addr
, &dns6_addr
,
247 scope_id
, &dns6_addr_time
);
252 static void slirp_init_once(void)
254 static int initialized
;
265 WSAStartup(MAKEWORD(2,0), &Data
);
266 atexit(winsock_cleanup
);
269 loopback_addr
.s_addr
= htonl(INADDR_LOOPBACK
);
270 loopback_mask
= htonl(IN_CLASSA_NET
);
273 static void slirp_state_save(QEMUFile
*f
, void *opaque
);
274 static int slirp_state_load(QEMUFile
*f
, void *opaque
, int version_id
);
276 static SaveVMHandlers savevm_slirp_state
= {
277 .save_state
= slirp_state_save
,
278 .load_state
= slirp_state_load
,
281 Slirp
*slirp_init(int restricted
, bool in_enabled
, struct in_addr vnetwork
,
282 struct in_addr vnetmask
, struct in_addr vhost
,
284 struct in6_addr vprefix_addr6
, uint8_t vprefix_len
,
285 struct in6_addr vhost6
, const char *vhostname
,
286 const char *tftp_server_name
,
287 const char *tftp_path
, const char *bootfile
,
288 struct in_addr vdhcp_start
, struct in_addr vnameserver
,
289 struct in6_addr vnameserver6
, const char **vdnssearch
,
290 const char *vdomainname
,
291 const SlirpCb
*callbacks
,
294 Slirp
*slirp
= g_malloc0(sizeof(Slirp
));
298 slirp
->cb
= callbacks
;
299 slirp
->grand
= g_rand_new();
300 slirp
->restricted
= restricted
;
302 slirp
->in_enabled
= in_enabled
;
303 slirp
->in6_enabled
= in6_enabled
;
309 /* Initialise mbufs *after* setting the MTU */
312 slirp
->vnetwork_addr
= vnetwork
;
313 slirp
->vnetwork_mask
= vnetmask
;
314 slirp
->vhost_addr
= vhost
;
315 slirp
->vprefix_addr6
= vprefix_addr6
;
316 slirp
->vprefix_len
= vprefix_len
;
317 slirp
->vhost_addr6
= vhost6
;
319 pstrcpy(slirp
->client_hostname
, sizeof(slirp
->client_hostname
),
322 slirp
->tftp_prefix
= g_strdup(tftp_path
);
323 slirp
->bootp_filename
= g_strdup(bootfile
);
324 slirp
->vdomainname
= g_strdup(vdomainname
);
325 slirp
->vdhcp_startaddr
= vdhcp_start
;
326 slirp
->vnameserver_addr
= vnameserver
;
327 slirp
->vnameserver_addr6
= vnameserver6
;
328 slirp
->tftp_server_name
= g_strdup(tftp_server_name
);
331 translate_dnssearch(slirp
, vdnssearch
);
334 slirp
->opaque
= opaque
;
336 register_savevm_live(NULL
, "slirp", 0, 4, &savevm_slirp_state
, slirp
);
338 QTAILQ_INSERT_TAIL(&slirp_instances
, slirp
, entry
);
343 void slirp_cleanup(Slirp
*slirp
)
345 struct ex_list
*e
, *next
;
347 for (e
= slirp
->exec_list
; e
; e
= next
) {
353 QTAILQ_REMOVE(&slirp_instances
, slirp
, entry
);
355 unregister_savevm(NULL
, "slirp", slirp
);
361 g_rand_free(slirp
->grand
);
363 g_free(slirp
->vdnssearch
);
364 g_free(slirp
->tftp_prefix
);
365 g_free(slirp
->bootp_filename
);
366 g_free(slirp
->vdomainname
);
370 #define CONN_CANFSEND(so) (((so)->so_state & (SS_FCANTSENDMORE|SS_ISFCONNECTED)) == SS_ISFCONNECTED)
371 #define CONN_CANFRCV(so) (((so)->so_state & (SS_FCANTRCVMORE|SS_ISFCONNECTED)) == SS_ISFCONNECTED)
373 static void slirp_update_timeout(uint32_t *timeout
)
378 if (*timeout
<= TIMEOUT_FAST
) {
382 t
= MIN(1000, *timeout
);
384 /* If we have tcp timeout with slirp, then we will fill @timeout with
385 * more precise value.
387 QTAILQ_FOREACH(slirp
, &slirp_instances
, entry
) {
388 if (slirp
->time_fasttimo
) {
389 *timeout
= TIMEOUT_FAST
;
392 if (slirp
->do_slowtimo
) {
393 t
= MIN(TIMEOUT_SLOW
, t
);
399 void slirp_pollfds_fill(GArray
*pollfds
, uint32_t *timeout
)
402 struct socket
*so
, *so_next
;
404 if (QTAILQ_EMPTY(&slirp_instances
)) {
412 QTAILQ_FOREACH(slirp
, &slirp_instances
, entry
) {
414 * *_slowtimo needs calling if there are IP fragments
415 * in the fragment queue, or there are TCP connections active
417 slirp
->do_slowtimo
= ((slirp
->tcb
.so_next
!= &slirp
->tcb
) ||
418 (&slirp
->ipq
.ip_link
!= slirp
->ipq
.ip_link
.next
));
420 for (so
= slirp
->tcb
.so_next
; so
!= &slirp
->tcb
;
424 so_next
= so
->so_next
;
426 so
->pollfds_idx
= -1;
429 * See if we need a tcp_fasttimo
431 if (slirp
->time_fasttimo
== 0 &&
432 so
->so_tcpcb
->t_flags
& TF_DELACK
) {
433 slirp
->time_fasttimo
= curtime
; /* Flag when want a fasttimo */
437 * NOFDREF can include still connecting to local-host,
438 * newly socreated() sockets etc. Don't want to select these.
440 if (so
->so_state
& SS_NOFDREF
|| so
->s
== -1) {
445 * Set for reading sockets which are accepting
447 if (so
->so_state
& SS_FACCEPTCONN
) {
450 .events
= G_IO_IN
| G_IO_HUP
| G_IO_ERR
,
452 so
->pollfds_idx
= pollfds
->len
;
453 g_array_append_val(pollfds
, pfd
);
458 * Set for writing sockets which are connecting
460 if (so
->so_state
& SS_ISFCONNECTING
) {
463 .events
= G_IO_OUT
| G_IO_ERR
,
465 so
->pollfds_idx
= pollfds
->len
;
466 g_array_append_val(pollfds
, pfd
);
471 * Set for writing if we are connected, can send more, and
472 * we have something to send
474 if (CONN_CANFSEND(so
) && so
->so_rcv
.sb_cc
) {
475 events
|= G_IO_OUT
| G_IO_ERR
;
479 * Set for reading (and urgent data) if we are connected, can
480 * receive more, and we have room for it XXX /2 ?
482 if (CONN_CANFRCV(so
) &&
483 (so
->so_snd
.sb_cc
< (so
->so_snd
.sb_datalen
/2))) {
484 events
|= G_IO_IN
| G_IO_HUP
| G_IO_ERR
| G_IO_PRI
;
492 so
->pollfds_idx
= pollfds
->len
;
493 g_array_append_val(pollfds
, pfd
);
500 for (so
= slirp
->udb
.so_next
; so
!= &slirp
->udb
;
502 so_next
= so
->so_next
;
504 so
->pollfds_idx
= -1;
507 * See if it's timed out
510 if (so
->so_expire
<= curtime
) {
514 slirp
->do_slowtimo
= true; /* Let socket expire */
519 * When UDP packets are received from over the
520 * link, they're sendto()'d straight away, so
521 * no need for setting for writing
522 * Limit the number of packets queued by this session
523 * to 4. Note that even though we try and limit this
524 * to 4 packets, the session could have more queued
525 * if the packets needed to be fragmented
528 if ((so
->so_state
& SS_ISFCONNECTED
) && so
->so_queued
<= 4) {
531 .events
= G_IO_IN
| G_IO_HUP
| G_IO_ERR
,
533 so
->pollfds_idx
= pollfds
->len
;
534 g_array_append_val(pollfds
, pfd
);
541 for (so
= slirp
->icmp
.so_next
; so
!= &slirp
->icmp
;
543 so_next
= so
->so_next
;
545 so
->pollfds_idx
= -1;
548 * See if it's timed out
551 if (so
->so_expire
<= curtime
) {
555 slirp
->do_slowtimo
= true; /* Let socket expire */
559 if (so
->so_state
& SS_ISFCONNECTED
) {
562 .events
= G_IO_IN
| G_IO_HUP
| G_IO_ERR
,
564 so
->pollfds_idx
= pollfds
->len
;
565 g_array_append_val(pollfds
, pfd
);
569 slirp_update_timeout(timeout
);
572 void slirp_pollfds_poll(GArray
*pollfds
, int select_error
)
575 struct socket
*so
, *so_next
;
578 if (QTAILQ_EMPTY(&slirp_instances
)) {
582 curtime
= qemu_clock_get_ms(QEMU_CLOCK_REALTIME
);
584 QTAILQ_FOREACH(slirp
, &slirp_instances
, entry
) {
586 * See if anything has timed out
588 if (slirp
->time_fasttimo
&&
589 ((curtime
- slirp
->time_fasttimo
) >= TIMEOUT_FAST
)) {
591 slirp
->time_fasttimo
= 0;
593 if (slirp
->do_slowtimo
&&
594 ((curtime
- slirp
->last_slowtimo
) >= TIMEOUT_SLOW
)) {
597 slirp
->last_slowtimo
= curtime
;
607 for (so
= slirp
->tcb
.so_next
; so
!= &slirp
->tcb
;
611 so_next
= so
->so_next
;
614 if (so
->pollfds_idx
!= -1) {
615 revents
= g_array_index(pollfds
, GPollFD
,
616 so
->pollfds_idx
).revents
;
619 if (so
->so_state
& SS_NOFDREF
|| so
->s
== -1) {
625 * This will soread as well, so no need to
626 * test for G_IO_IN below if this succeeds
628 if (revents
& G_IO_PRI
) {
631 /* Socket error might have resulted in the socket being
632 * removed, do not try to do anything more with it. */
637 * Check sockets for reading
639 else if (revents
& (G_IO_IN
| G_IO_HUP
| G_IO_ERR
)) {
641 * Check for incoming connections
643 if (so
->so_state
& SS_FACCEPTCONN
) {
649 /* Output it if we read something */
651 tcp_output(sototcpcb(so
));
654 /* Socket error might have resulted in the socket being
655 * removed, do not try to do anything more with it. */
661 * Check sockets for writing
663 if (!(so
->so_state
& SS_NOFDREF
) &&
664 (revents
& (G_IO_OUT
| G_IO_ERR
))) {
666 * Check for non-blocking, still-connecting sockets
668 if (so
->so_state
& SS_ISFCONNECTING
) {
670 so
->so_state
&= ~SS_ISFCONNECTING
;
672 ret
= send(so
->s
, (const void *) &ret
, 0, 0);
674 /* XXXXX Must fix, zero bytes is a NOP */
675 if (errno
== EAGAIN
|| errno
== EWOULDBLOCK
||
676 errno
== EINPROGRESS
|| errno
== ENOTCONN
) {
681 so
->so_state
&= SS_PERSISTENT_MASK
;
682 so
->so_state
|= SS_NOFDREF
;
684 /* else so->so_state &= ~SS_ISFCONNECTING; */
689 tcp_input((struct mbuf
*)NULL
, sizeof(struct ip
), so
,
695 /* Call tcp_output in case we need to send a window
696 * update to the guest, otherwise it will be stuck
697 * until it sends a window probe. */
698 tcp_output(sototcpcb(so
));
706 * Incoming packets are sent straight away, they're not buffered.
707 * Incoming UDP data isn't buffered either.
709 for (so
= slirp
->udb
.so_next
; so
!= &slirp
->udb
;
713 so_next
= so
->so_next
;
716 if (so
->pollfds_idx
!= -1) {
717 revents
= g_array_index(pollfds
, GPollFD
,
718 so
->pollfds_idx
).revents
;
722 (revents
& (G_IO_IN
| G_IO_HUP
| G_IO_ERR
))) {
728 * Check incoming ICMP relies.
730 for (so
= slirp
->icmp
.so_next
; so
!= &slirp
->icmp
;
734 so_next
= so
->so_next
;
737 if (so
->pollfds_idx
!= -1) {
738 revents
= g_array_index(pollfds
, GPollFD
,
739 so
->pollfds_idx
).revents
;
743 (revents
& (G_IO_IN
| G_IO_HUP
| G_IO_ERR
))) {
753 static void arp_input(Slirp
*slirp
, const uint8_t *pkt
, int pkt_len
)
755 struct slirp_arphdr
*ah
= (struct slirp_arphdr
*)(pkt
+ ETH_HLEN
);
756 uint8_t arp_reply
[MAX(ETH_HLEN
+ sizeof(struct slirp_arphdr
), 64)];
757 struct ethhdr
*reh
= (struct ethhdr
*)arp_reply
;
758 struct slirp_arphdr
*rah
= (struct slirp_arphdr
*)(arp_reply
+ ETH_HLEN
);
760 struct ex_list
*ex_ptr
;
762 if (!slirp
->in_enabled
) {
766 ar_op
= ntohs(ah
->ar_op
);
769 if (ah
->ar_tip
== ah
->ar_sip
) {
771 arp_table_add(slirp
, ah
->ar_sip
, ah
->ar_sha
);
775 if ((ah
->ar_tip
& slirp
->vnetwork_mask
.s_addr
) ==
776 slirp
->vnetwork_addr
.s_addr
) {
777 if (ah
->ar_tip
== slirp
->vnameserver_addr
.s_addr
||
778 ah
->ar_tip
== slirp
->vhost_addr
.s_addr
)
780 for (ex_ptr
= slirp
->exec_list
; ex_ptr
; ex_ptr
= ex_ptr
->ex_next
) {
781 if (ex_ptr
->ex_addr
.s_addr
== ah
->ar_tip
)
786 memset(arp_reply
, 0, sizeof(arp_reply
));
788 arp_table_add(slirp
, ah
->ar_sip
, ah
->ar_sha
);
790 /* ARP request for alias/dns mac address */
791 memcpy(reh
->h_dest
, pkt
+ ETH_ALEN
, ETH_ALEN
);
792 memcpy(reh
->h_source
, special_ethaddr
, ETH_ALEN
- 4);
793 memcpy(&reh
->h_source
[2], &ah
->ar_tip
, 4);
794 reh
->h_proto
= htons(ETH_P_ARP
);
796 rah
->ar_hrd
= htons(1);
797 rah
->ar_pro
= htons(ETH_P_IP
);
798 rah
->ar_hln
= ETH_ALEN
;
800 rah
->ar_op
= htons(ARPOP_REPLY
);
801 memcpy(rah
->ar_sha
, reh
->h_source
, ETH_ALEN
);
802 rah
->ar_sip
= ah
->ar_tip
;
803 memcpy(rah
->ar_tha
, ah
->ar_sha
, ETH_ALEN
);
804 rah
->ar_tip
= ah
->ar_sip
;
805 slirp
->cb
->output(slirp
->opaque
, arp_reply
, sizeof(arp_reply
));
809 arp_table_add(slirp
, ah
->ar_sip
, ah
->ar_sha
);
816 void slirp_input(Slirp
*slirp
, const uint8_t *pkt
, int pkt_len
)
821 if (pkt_len
< ETH_HLEN
)
824 proto
= ntohs(*(uint16_t *)(pkt
+ 12));
827 arp_input(slirp
, pkt
, pkt_len
);
834 /* Note: we add 2 to align the IP header on 4 bytes,
835 * and add the margin for the tcpiphdr overhead */
836 if (M_FREEROOM(m
) < pkt_len
+ TCPIPHDR_DELTA
+ 2) {
837 m_inc(m
, pkt_len
+ TCPIPHDR_DELTA
+ 2);
839 m
->m_len
= pkt_len
+ TCPIPHDR_DELTA
+ 2;
840 memcpy(m
->m_data
+ TCPIPHDR_DELTA
+ 2, pkt
, pkt_len
);
842 m
->m_data
+= TCPIPHDR_DELTA
+ 2 + ETH_HLEN
;
843 m
->m_len
-= TCPIPHDR_DELTA
+ 2 + ETH_HLEN
;
845 if (proto
== ETH_P_IP
) {
847 } else if (proto
== ETH_P_IPV6
) {
853 ncsi_input(slirp
, pkt
, pkt_len
);
861 /* Prepare the IPv4 packet to be sent to the ethernet device. Returns 1 if no
862 * packet should be sent, 0 if the packet must be re-queued, 2 if the packet
865 static int if_encap4(Slirp
*slirp
, struct mbuf
*ifm
, struct ethhdr
*eh
,
866 uint8_t ethaddr
[ETH_ALEN
])
868 const struct ip
*iph
= (const struct ip
*)ifm
->m_data
;
870 if (iph
->ip_dst
.s_addr
== 0) {
871 /* 0.0.0.0 can not be a destination address, something went wrong,
872 * avoid making it worse */
875 if (!arp_table_search(slirp
, iph
->ip_dst
.s_addr
, ethaddr
)) {
876 uint8_t arp_req
[ETH_HLEN
+ sizeof(struct slirp_arphdr
)];
877 struct ethhdr
*reh
= (struct ethhdr
*)arp_req
;
878 struct slirp_arphdr
*rah
= (struct slirp_arphdr
*)(arp_req
+ ETH_HLEN
);
880 if (!ifm
->resolution_requested
) {
881 /* If the client addr is not known, send an ARP request */
882 memset(reh
->h_dest
, 0xff, ETH_ALEN
);
883 memcpy(reh
->h_source
, special_ethaddr
, ETH_ALEN
- 4);
884 memcpy(&reh
->h_source
[2], &slirp
->vhost_addr
, 4);
885 reh
->h_proto
= htons(ETH_P_ARP
);
886 rah
->ar_hrd
= htons(1);
887 rah
->ar_pro
= htons(ETH_P_IP
);
888 rah
->ar_hln
= ETH_ALEN
;
890 rah
->ar_op
= htons(ARPOP_REQUEST
);
893 memcpy(rah
->ar_sha
, special_ethaddr
, ETH_ALEN
- 4);
894 memcpy(&rah
->ar_sha
[2], &slirp
->vhost_addr
, 4);
897 rah
->ar_sip
= slirp
->vhost_addr
.s_addr
;
899 /* target hw addr (none) */
900 memset(rah
->ar_tha
, 0, ETH_ALEN
);
903 rah
->ar_tip
= iph
->ip_dst
.s_addr
;
904 slirp
->client_ipaddr
= iph
->ip_dst
;
905 slirp
->cb
->output(slirp
->opaque
, arp_req
, sizeof(arp_req
));
906 ifm
->resolution_requested
= true;
908 /* Expire request and drop outgoing packet after 1 second */
909 ifm
->expiration_date
= qemu_clock_get_ns(QEMU_CLOCK_REALTIME
) + 1000000000ULL;
913 memcpy(eh
->h_source
, special_ethaddr
, ETH_ALEN
- 4);
914 /* XXX: not correct */
915 memcpy(&eh
->h_source
[2], &slirp
->vhost_addr
, 4);
916 eh
->h_proto
= htons(ETH_P_IP
);
923 /* Prepare the IPv6 packet to be sent to the ethernet device. Returns 1 if no
924 * packet should be sent, 0 if the packet must be re-queued, 2 if the packet
927 static int if_encap6(Slirp
*slirp
, struct mbuf
*ifm
, struct ethhdr
*eh
,
928 uint8_t ethaddr
[ETH_ALEN
])
930 const struct ip6
*ip6h
= mtod(ifm
, const struct ip6
*);
931 if (!ndp_table_search(slirp
, ip6h
->ip_dst
, ethaddr
)) {
932 if (!ifm
->resolution_requested
) {
933 ndp_send_ns(slirp
, ip6h
->ip_dst
);
934 ifm
->resolution_requested
= true;
935 ifm
->expiration_date
=
936 qemu_clock_get_ns(QEMU_CLOCK_REALTIME
) + 1000000000ULL;
940 eh
->h_proto
= htons(ETH_P_IPV6
);
941 in6_compute_ethaddr(ip6h
->ip_src
, eh
->h_source
);
948 /* Output the IP packet to the ethernet device. Returns 0 if the packet must be
951 int if_encap(Slirp
*slirp
, struct mbuf
*ifm
)
954 struct ethhdr
*eh
= (struct ethhdr
*)buf
;
955 uint8_t ethaddr
[ETH_ALEN
];
956 const struct ip
*iph
= (const struct ip
*)ifm
->m_data
;
959 if (ifm
->m_len
+ ETH_HLEN
> sizeof(buf
)) {
965 ret
= if_encap4(slirp
, ifm
, eh
, ethaddr
);
972 ret
= if_encap6(slirp
, ifm
, eh
, ethaddr
);
979 g_assert_not_reached();
983 memcpy(eh
->h_dest
, ethaddr
, ETH_ALEN
);
984 DEBUG_ARGS((dfd
, " src = %02x:%02x:%02x:%02x:%02x:%02x\n",
985 eh
->h_source
[0], eh
->h_source
[1], eh
->h_source
[2],
986 eh
->h_source
[3], eh
->h_source
[4], eh
->h_source
[5]));
987 DEBUG_ARGS((dfd
, " dst = %02x:%02x:%02x:%02x:%02x:%02x\n",
988 eh
->h_dest
[0], eh
->h_dest
[1], eh
->h_dest
[2],
989 eh
->h_dest
[3], eh
->h_dest
[4], eh
->h_dest
[5]));
990 memcpy(buf
+ sizeof(struct ethhdr
), ifm
->m_data
, ifm
->m_len
);
991 slirp
->cb
->output(slirp
->opaque
, buf
, ifm
->m_len
+ ETH_HLEN
);
995 /* Drop host forwarding rule, return 0 if found. */
996 int slirp_remove_hostfwd(Slirp
*slirp
, int is_udp
, struct in_addr host_addr
,
1000 struct socket
*head
= (is_udp
? &slirp
->udb
: &slirp
->tcb
);
1001 struct sockaddr_in addr
;
1002 int port
= htons(host_port
);
1005 for (so
= head
->so_next
; so
!= head
; so
= so
->so_next
) {
1006 addr_len
= sizeof(addr
);
1007 if ((so
->so_state
& SS_HOSTFWD
) &&
1008 getsockname(so
->s
, (struct sockaddr
*)&addr
, &addr_len
) == 0 &&
1009 addr
.sin_addr
.s_addr
== host_addr
.s_addr
&&
1010 addr
.sin_port
== port
) {
1020 int slirp_add_hostfwd(Slirp
*slirp
, int is_udp
, struct in_addr host_addr
,
1021 int host_port
, struct in_addr guest_addr
, int guest_port
)
1023 if (!guest_addr
.s_addr
) {
1024 guest_addr
= slirp
->vdhcp_startaddr
;
1027 if (!udp_listen(slirp
, host_addr
.s_addr
, htons(host_port
),
1028 guest_addr
.s_addr
, htons(guest_port
), SS_HOSTFWD
))
1031 if (!tcp_listen(slirp
, host_addr
.s_addr
, htons(host_port
),
1032 guest_addr
.s_addr
, htons(guest_port
), SS_HOSTFWD
))
1038 int slirp_add_exec(Slirp
*slirp
, void *chardev
, const char *cmdline
,
1039 struct in_addr
*guest_addr
, int guest_port
)
1041 if (!guest_addr
->s_addr
) {
1042 guest_addr
->s_addr
= slirp
->vnetwork_addr
.s_addr
|
1043 (htonl(0x0204) & ~slirp
->vnetwork_mask
.s_addr
);
1045 if ((guest_addr
->s_addr
& slirp
->vnetwork_mask
.s_addr
) !=
1046 slirp
->vnetwork_addr
.s_addr
||
1047 guest_addr
->s_addr
== slirp
->vhost_addr
.s_addr
||
1048 guest_addr
->s_addr
== slirp
->vnameserver_addr
.s_addr
) {
1052 return add_exec(&slirp
->exec_list
, chardev
, cmdline
, *guest_addr
,
1056 ssize_t
slirp_send(struct socket
*so
, const void *buf
, size_t len
, int flags
)
1058 if (so
->s
== -1 && so
->chardev
) {
1059 /* XXX this blocks entire thread. Rewrite to use
1060 * qemu_chr_fe_write and background I/O callbacks */
1061 qemu_chr_fe_write_all(so
->chardev
, buf
, len
);
1067 * This should in theory not happen but it is hard to be
1068 * sure because some code paths will end up with so->s == -1
1069 * on a failure but don't dispose of the struct socket.
1070 * Check specifically, so we don't pass -1 to send().
1076 return send(so
->s
, buf
, len
, flags
);
1079 static struct socket
*
1080 slirp_find_ctl_socket(Slirp
*slirp
, struct in_addr guest_addr
, int guest_port
)
1084 for (so
= slirp
->tcb
.so_next
; so
!= &slirp
->tcb
; so
= so
->so_next
) {
1085 if (so
->so_faddr
.s_addr
== guest_addr
.s_addr
&&
1086 htons(so
->so_fport
) == guest_port
) {
1093 size_t slirp_socket_can_recv(Slirp
*slirp
, struct in_addr guest_addr
,
1096 struct iovec iov
[2];
1099 so
= slirp_find_ctl_socket(slirp
, guest_addr
, guest_port
);
1101 if (!so
|| so
->so_state
& SS_NOFDREF
) {
1105 if (!CONN_CANFRCV(so
) || so
->so_snd
.sb_cc
>= (so
->so_snd
.sb_datalen
/2)) {
1109 return sopreprbuf(so
, iov
, NULL
);
1112 void slirp_socket_recv(Slirp
*slirp
, struct in_addr guest_addr
, int guest_port
,
1113 const uint8_t *buf
, int size
)
1116 struct socket
*so
= slirp_find_ctl_socket(slirp
, guest_addr
, guest_port
);
1121 ret
= soreadbuf(so
, (const char *)buf
, size
);
1124 tcp_output(sototcpcb(so
));
1127 static int slirp_tcp_post_load(void *opaque
, int version
)
1129 tcp_template((struct tcpcb
*)opaque
);
1134 static const VMStateDescription vmstate_slirp_tcp
= {
1135 .name
= "slirp-tcp",
1137 .post_load
= slirp_tcp_post_load
,
1138 .fields
= (VMStateField
[]) {
1139 VMSTATE_INT16(t_state
, struct tcpcb
),
1140 VMSTATE_INT16_ARRAY(t_timer
, struct tcpcb
, TCPT_NTIMERS
),
1141 VMSTATE_INT16(t_rxtshift
, struct tcpcb
),
1142 VMSTATE_INT16(t_rxtcur
, struct tcpcb
),
1143 VMSTATE_INT16(t_dupacks
, struct tcpcb
),
1144 VMSTATE_UINT16(t_maxseg
, struct tcpcb
),
1145 VMSTATE_UINT8(t_force
, struct tcpcb
),
1146 VMSTATE_UINT16(t_flags
, struct tcpcb
),
1147 VMSTATE_UINT32(snd_una
, struct tcpcb
),
1148 VMSTATE_UINT32(snd_nxt
, struct tcpcb
),
1149 VMSTATE_UINT32(snd_up
, struct tcpcb
),
1150 VMSTATE_UINT32(snd_wl1
, struct tcpcb
),
1151 VMSTATE_UINT32(snd_wl2
, struct tcpcb
),
1152 VMSTATE_UINT32(iss
, struct tcpcb
),
1153 VMSTATE_UINT32(snd_wnd
, struct tcpcb
),
1154 VMSTATE_UINT32(rcv_wnd
, struct tcpcb
),
1155 VMSTATE_UINT32(rcv_nxt
, struct tcpcb
),
1156 VMSTATE_UINT32(rcv_up
, struct tcpcb
),
1157 VMSTATE_UINT32(irs
, struct tcpcb
),
1158 VMSTATE_UINT32(rcv_adv
, struct tcpcb
),
1159 VMSTATE_UINT32(snd_max
, struct tcpcb
),
1160 VMSTATE_UINT32(snd_cwnd
, struct tcpcb
),
1161 VMSTATE_UINT32(snd_ssthresh
, struct tcpcb
),
1162 VMSTATE_INT16(t_idle
, struct tcpcb
),
1163 VMSTATE_INT16(t_rtt
, struct tcpcb
),
1164 VMSTATE_UINT32(t_rtseq
, struct tcpcb
),
1165 VMSTATE_INT16(t_srtt
, struct tcpcb
),
1166 VMSTATE_INT16(t_rttvar
, struct tcpcb
),
1167 VMSTATE_UINT16(t_rttmin
, struct tcpcb
),
1168 VMSTATE_UINT32(max_sndwnd
, struct tcpcb
),
1169 VMSTATE_UINT8(t_oobflags
, struct tcpcb
),
1170 VMSTATE_UINT8(t_iobc
, struct tcpcb
),
1171 VMSTATE_INT16(t_softerror
, struct tcpcb
),
1172 VMSTATE_UINT8(snd_scale
, struct tcpcb
),
1173 VMSTATE_UINT8(rcv_scale
, struct tcpcb
),
1174 VMSTATE_UINT8(request_r_scale
, struct tcpcb
),
1175 VMSTATE_UINT8(requested_s_scale
, struct tcpcb
),
1176 VMSTATE_UINT32(ts_recent
, struct tcpcb
),
1177 VMSTATE_UINT32(ts_recent_age
, struct tcpcb
),
1178 VMSTATE_UINT32(last_ack_sent
, struct tcpcb
),
1179 VMSTATE_END_OF_LIST()
1183 /* The sbuf has a pair of pointers that are migrated as offsets;
1184 * we calculate the offsets and restore the pointers using
1185 * pre_save/post_load on a tmp structure.
1188 struct sbuf
*parent
;
1189 uint32_t roff
, woff
;
1192 static int sbuf_tmp_pre_save(void *opaque
)
1194 struct sbuf_tmp
*tmp
= opaque
;
1195 tmp
->woff
= tmp
->parent
->sb_wptr
- tmp
->parent
->sb_data
;
1196 tmp
->roff
= tmp
->parent
->sb_rptr
- tmp
->parent
->sb_data
;
1201 static int sbuf_tmp_post_load(void *opaque
, int version
)
1203 struct sbuf_tmp
*tmp
= opaque
;
1204 uint32_t requested_len
= tmp
->parent
->sb_datalen
;
1206 /* Allocate the buffer space used by the field after the tmp */
1207 sbreserve(tmp
->parent
, tmp
->parent
->sb_datalen
);
1209 if (tmp
->parent
->sb_datalen
!= requested_len
) {
1212 if (tmp
->woff
>= requested_len
||
1213 tmp
->roff
>= requested_len
) {
1214 error_report("invalid sbuf offsets r/w=%u/%u len=%u",
1215 tmp
->roff
, tmp
->woff
, requested_len
);
1219 tmp
->parent
->sb_wptr
= tmp
->parent
->sb_data
+ tmp
->woff
;
1220 tmp
->parent
->sb_rptr
= tmp
->parent
->sb_data
+ tmp
->roff
;
1226 static const VMStateDescription vmstate_slirp_sbuf_tmp
= {
1227 .name
= "slirp-sbuf-tmp",
1228 .post_load
= sbuf_tmp_post_load
,
1229 .pre_save
= sbuf_tmp_pre_save
,
1231 .fields
= (VMStateField
[]) {
1232 VMSTATE_UINT32(woff
, struct sbuf_tmp
),
1233 VMSTATE_UINT32(roff
, struct sbuf_tmp
),
1234 VMSTATE_END_OF_LIST()
1238 static const VMStateDescription vmstate_slirp_sbuf
= {
1239 .name
= "slirp-sbuf",
1241 .fields
= (VMStateField
[]) {
1242 VMSTATE_UINT32(sb_cc
, struct sbuf
),
1243 VMSTATE_UINT32(sb_datalen
, struct sbuf
),
1244 VMSTATE_WITH_TMP(struct sbuf
, struct sbuf_tmp
, vmstate_slirp_sbuf_tmp
),
1245 VMSTATE_VBUFFER_UINT32(sb_data
, struct sbuf
, 0, NULL
, sb_datalen
),
1246 VMSTATE_END_OF_LIST()
1250 static bool slirp_older_than_v4(void *opaque
, int version_id
)
1252 return version_id
< 4;
1255 static bool slirp_family_inet(void *opaque
, int version_id
)
1257 union slirp_sockaddr
*ssa
= (union slirp_sockaddr
*)opaque
;
1258 return ssa
->ss
.ss_family
== AF_INET
;
1261 static int slirp_socket_pre_load(void *opaque
)
1263 struct socket
*so
= opaque
;
1264 if (tcp_attach(so
) < 0) {
1267 /* Older versions don't load these fields */
1268 so
->so_ffamily
= AF_INET
;
1269 so
->so_lfamily
= AF_INET
;
1274 #define VMSTATE_SIN4_ADDR(f, s, t) VMSTATE_UINT32_TEST(f, s, t)
1276 /* Win uses u_long rather than uint32_t - but it's still 32bits long */
1277 #define VMSTATE_SIN4_ADDR(f, s, t) VMSTATE_SINGLE_TEST(f, s, t, 0, \
1278 vmstate_info_uint32, u_long)
1281 /* The OS provided ss_family field isn't that portable; it's size
1282 * and type varies (16/8 bit, signed, unsigned)
1283 * and the values it contains aren't fully portable.
1285 typedef struct SS_FamilyTmpStruct
{
1286 union slirp_sockaddr
*parent
;
1287 uint16_t portable_family
;
1288 } SS_FamilyTmpStruct
;
1290 #define SS_FAMILY_MIG_IPV4 2 /* Linux, BSD, Win... */
1291 #define SS_FAMILY_MIG_IPV6 10 /* Linux */
1292 #define SS_FAMILY_MIG_OTHER 0xffff
1294 static int ss_family_pre_save(void *opaque
)
1296 SS_FamilyTmpStruct
*tss
= opaque
;
1298 tss
->portable_family
= SS_FAMILY_MIG_OTHER
;
1300 if (tss
->parent
->ss
.ss_family
== AF_INET
) {
1301 tss
->portable_family
= SS_FAMILY_MIG_IPV4
;
1302 } else if (tss
->parent
->ss
.ss_family
== AF_INET6
) {
1303 tss
->portable_family
= SS_FAMILY_MIG_IPV6
;
1309 static int ss_family_post_load(void *opaque
, int version_id
)
1311 SS_FamilyTmpStruct
*tss
= opaque
;
1313 switch (tss
->portable_family
) {
1314 case SS_FAMILY_MIG_IPV4
:
1315 tss
->parent
->ss
.ss_family
= AF_INET
;
1317 case SS_FAMILY_MIG_IPV6
:
1318 case 23: /* compatibility: AF_INET6 from mingw */
1319 case 28: /* compatibility: AF_INET6 from FreeBSD sys/socket.h */
1320 tss
->parent
->ss
.ss_family
= AF_INET6
;
1323 error_report("invalid ss_family type %x", tss
->portable_family
);
1330 static const VMStateDescription vmstate_slirp_ss_family
= {
1331 .name
= "slirp-socket-addr/ss_family",
1332 .pre_save
= ss_family_pre_save
,
1333 .post_load
= ss_family_post_load
,
1334 .fields
= (VMStateField
[]) {
1335 VMSTATE_UINT16(portable_family
, SS_FamilyTmpStruct
),
1336 VMSTATE_END_OF_LIST()
1340 static const VMStateDescription vmstate_slirp_socket_addr
= {
1341 .name
= "slirp-socket-addr",
1343 .fields
= (VMStateField
[]) {
1344 VMSTATE_WITH_TMP(union slirp_sockaddr
, SS_FamilyTmpStruct
,
1345 vmstate_slirp_ss_family
),
1346 VMSTATE_SIN4_ADDR(sin
.sin_addr
.s_addr
, union slirp_sockaddr
,
1348 VMSTATE_UINT16_TEST(sin
.sin_port
, union slirp_sockaddr
,
1352 /* Untested: Needs checking by someone with IPv6 test */
1353 VMSTATE_BUFFER_TEST(sin6
.sin6_addr
, union slirp_sockaddr
,
1354 slirp_family_inet6
),
1355 VMSTATE_UINT16_TEST(sin6
.sin6_port
, union slirp_sockaddr
,
1356 slirp_family_inet6
),
1357 VMSTATE_UINT32_TEST(sin6
.sin6_flowinfo
, union slirp_sockaddr
,
1358 slirp_family_inet6
),
1359 VMSTATE_UINT32_TEST(sin6
.sin6_scope_id
, union slirp_sockaddr
,
1360 slirp_family_inet6
),
1363 VMSTATE_END_OF_LIST()
1367 static const VMStateDescription vmstate_slirp_socket
= {
1368 .name
= "slirp-socket",
1370 .pre_load
= slirp_socket_pre_load
,
1371 .fields
= (VMStateField
[]) {
1372 VMSTATE_UINT32(so_urgc
, struct socket
),
1373 /* Pre-v4 versions */
1374 VMSTATE_SIN4_ADDR(so_faddr
.s_addr
, struct socket
,
1375 slirp_older_than_v4
),
1376 VMSTATE_SIN4_ADDR(so_laddr
.s_addr
, struct socket
,
1377 slirp_older_than_v4
),
1378 VMSTATE_UINT16_TEST(so_fport
, struct socket
, slirp_older_than_v4
),
1379 VMSTATE_UINT16_TEST(so_lport
, struct socket
, slirp_older_than_v4
),
1381 VMSTATE_STRUCT(fhost
, struct socket
, 4, vmstate_slirp_socket_addr
,
1382 union slirp_sockaddr
),
1383 VMSTATE_STRUCT(lhost
, struct socket
, 4, vmstate_slirp_socket_addr
,
1384 union slirp_sockaddr
),
1386 VMSTATE_UINT8(so_iptos
, struct socket
),
1387 VMSTATE_UINT8(so_emu
, struct socket
),
1388 VMSTATE_UINT8(so_type
, struct socket
),
1389 VMSTATE_INT32(so_state
, struct socket
),
1390 VMSTATE_STRUCT(so_rcv
, struct socket
, 0, vmstate_slirp_sbuf
,
1392 VMSTATE_STRUCT(so_snd
, struct socket
, 0, vmstate_slirp_sbuf
,
1394 VMSTATE_STRUCT_POINTER(so_tcpcb
, struct socket
, vmstate_slirp_tcp
,
1396 VMSTATE_END_OF_LIST()
1400 static const VMStateDescription vmstate_slirp_bootp_client
= {
1401 .name
= "slirp_bootpclient",
1402 .fields
= (VMStateField
[]) {
1403 VMSTATE_UINT16(allocated
, BOOTPClient
),
1404 VMSTATE_BUFFER(macaddr
, BOOTPClient
),
1405 VMSTATE_END_OF_LIST()
1409 static const VMStateDescription vmstate_slirp
= {
1412 .fields
= (VMStateField
[]) {
1413 VMSTATE_UINT16_V(ip_id
, Slirp
, 2),
1414 VMSTATE_STRUCT_ARRAY(bootp_clients
, Slirp
, NB_BOOTP_CLIENTS
, 3,
1415 vmstate_slirp_bootp_client
, BOOTPClient
),
1416 VMSTATE_END_OF_LIST()
1420 static void slirp_state_save(QEMUFile
*f
, void *opaque
)
1422 Slirp
*slirp
= opaque
;
1423 struct ex_list
*ex_ptr
;
1425 for (ex_ptr
= slirp
->exec_list
; ex_ptr
; ex_ptr
= ex_ptr
->ex_next
)
1426 if (ex_ptr
->ex_chardev
) {
1428 so
= slirp_find_ctl_socket(slirp
, ex_ptr
->ex_addr
,
1429 ntohs(ex_ptr
->ex_fport
));
1433 qemu_put_byte(f
, 42);
1434 vmstate_save_state(f
, &vmstate_slirp_socket
, so
, NULL
);
1436 qemu_put_byte(f
, 0);
1438 vmstate_save_state(f
, &vmstate_slirp
, slirp
, NULL
);
1442 static int slirp_state_load(QEMUFile
*f
, void *opaque
, int version_id
)
1444 Slirp
*slirp
= opaque
;
1445 struct ex_list
*ex_ptr
;
1447 while (qemu_get_byte(f
)) {
1449 struct socket
*so
= socreate(slirp
);
1451 ret
= vmstate_load_state(f
, &vmstate_slirp_socket
, so
, version_id
);
1456 if ((so
->so_faddr
.s_addr
& slirp
->vnetwork_mask
.s_addr
) !=
1457 slirp
->vnetwork_addr
.s_addr
) {
1460 for (ex_ptr
= slirp
->exec_list
; ex_ptr
; ex_ptr
= ex_ptr
->ex_next
) {
1461 if (ex_ptr
->ex_chardev
&&
1462 so
->so_faddr
.s_addr
== ex_ptr
->ex_addr
.s_addr
&&
1463 so
->so_fport
== ex_ptr
->ex_fport
) {
1471 return vmstate_load_state(f
, &vmstate_slirp
, slirp
, version_id
);