4 * Copyright (c) 2004-2008 Fabrice Bellard
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
24 #include "qemu/osdep.h"
25 #include "qemu-common.h"
26 #include "qemu/timer.h"
27 #include "qemu/error-report.h"
28 #include "chardev/char-fe.h"
29 #include "migration/register.h"
32 #include "qemu/cutils.h"
38 /* host loopback address */
39 struct in_addr loopback_addr;
40 /* host loopback network mask */
41 unsigned long loopback_mask;
43 /* emulated hosts use the MAC addr 52:55:IP:IP:IP:IP */
44 static const uint8_t special_ethaddr[ETH_ALEN] = {
45 0x52, 0x55, 0x00, 0x00, 0x00, 0x00
50 static QTAILQ_HEAD(, Slirp) slirp_instances =
51 QTAILQ_HEAD_INITIALIZER(slirp_instances);
53 static struct in_addr dns_addr;
55 static struct in6_addr dns6_addr;
57 static u_int dns_addr_time;
59 static u_int dns6_addr_time;
62 #define TIMEOUT_FAST 2 /* milliseconds */
63 #define TIMEOUT_SLOW 499 /* milliseconds */
64 /* for the aging of certain requests like DNS */
65 #define TIMEOUT_DEFAULT 1000 /* milliseconds */
69 int get_dns_addr(struct in_addr *pdns_addr)
71 FIXED_INFO *FixedInfo=NULL;
74 IP_ADDR_STRING *pIPAddr;
75 struct in_addr tmp_addr;
77 if (dns_addr.s_addr != 0 && (curtime - dns_addr_time) < TIMEOUT_DEFAULT) {
78 *pdns_addr = dns_addr;
82 FixedInfo = (FIXED_INFO *)GlobalAlloc(GPTR, sizeof(FIXED_INFO));
83 BufLen = sizeof(FIXED_INFO);
85 if (ERROR_BUFFER_OVERFLOW == GetNetworkParams(FixedInfo, &BufLen)) {
87 GlobalFree(FixedInfo);
90 FixedInfo = GlobalAlloc(GPTR, BufLen);
93 if ((ret = GetNetworkParams(FixedInfo, &BufLen)) != ERROR_SUCCESS) {
94 printf("GetNetworkParams failed. ret = %08x\n", (u_int)ret );
96 GlobalFree(FixedInfo);
102 pIPAddr = &(FixedInfo->DnsServerList);
103 inet_aton(pIPAddr->IpAddress.String, &tmp_addr);
104 *pdns_addr = tmp_addr;
106 dns_addr_time = curtime;
108 GlobalFree(FixedInfo);
114 int get_dns6_addr(struct in6_addr *pdns6_addr, uint32_t *scope_id)
119 static void winsock_cleanup(void)
126 static int get_dns_addr_cached(void *pdns_addr, void *cached_addr,
128 struct stat *cached_stat, u_int *cached_time)
130 struct stat old_stat;
131 if (curtime - *cached_time < TIMEOUT_DEFAULT) {
132 memcpy(pdns_addr, cached_addr, addrlen);
135 old_stat = *cached_stat;
136 if (stat("/etc/resolv.conf", cached_stat) != 0) {
139 if (cached_stat->st_dev == old_stat.st_dev
140 && cached_stat->st_ino == old_stat.st_ino
141 && cached_stat->st_size == old_stat.st_size
142 && cached_stat->st_mtime == old_stat.st_mtime) {
143 memcpy(pdns_addr, cached_addr, addrlen);
149 static int get_dns_addr_resolv_conf(int af, void *pdns_addr, void *cached_addr,
150 socklen_t addrlen, uint32_t *scope_id,
157 void *tmp_addr = alloca(addrlen);
160 f = fopen("/etc/resolv.conf", "r");
165 fprintf(stderr, "IP address of your DNS(s): ");
167 while (fgets(buff, 512, f) != NULL) {
168 if (sscanf(buff, "nameserver%*[ \t]%256s", buff2) == 1) {
169 char *c = strchr(buff2, '%');
171 if_index = if_nametoindex(c + 1);
177 if (!inet_pton(af, buff2, tmp_addr)) {
180 /* If it's the first one, set it to dns_addr */
182 memcpy(pdns_addr, tmp_addr, addrlen);
183 memcpy(cached_addr, tmp_addr, addrlen);
185 *scope_id = if_index;
187 *cached_time = curtime;
191 fprintf(stderr, ", ");
195 fprintf(stderr, "(more)");
201 char s[INET6_ADDRSTRLEN];
202 const char *res = inet_ntop(af, tmp_addr, s, sizeof(s));
204 res = "(string conversion error)";
206 fprintf(stderr, "%s", res);
217 int get_dns_addr(struct in_addr *pdns_addr)
219 static struct stat dns_addr_stat;
221 if (dns_addr.s_addr != 0) {
223 ret = get_dns_addr_cached(pdns_addr, &dns_addr, sizeof(dns_addr),
224 &dns_addr_stat, &dns_addr_time);
229 return get_dns_addr_resolv_conf(AF_INET, pdns_addr, &dns_addr,
230 sizeof(dns_addr), NULL, &dns_addr_time);
233 int get_dns6_addr(struct in6_addr *pdns6_addr, uint32_t *scope_id)
235 static struct stat dns6_addr_stat;
237 if (!in6_zero(&dns6_addr)) {
239 ret = get_dns_addr_cached(pdns6_addr, &dns6_addr, sizeof(dns6_addr),
240 &dns6_addr_stat, &dns6_addr_time);
245 return get_dns_addr_resolv_conf(AF_INET6, pdns6_addr, &dns6_addr,
247 scope_id, &dns6_addr_time);
252 static void slirp_init_once(void)
254 static int initialized;
265 WSAStartup(MAKEWORD(2,0), &Data);
266 atexit(winsock_cleanup);
269 loopback_addr.s_addr = htonl(INADDR_LOOPBACK);
270 loopback_mask = htonl(IN_CLASSA_NET);
273 static void slirp_state_save(QEMUFile *f, void *opaque);
274 static int slirp_state_load(QEMUFile *f, void *opaque, int version_id);
276 static SaveVMHandlers savevm_slirp_state = {
277 .save_state = slirp_state_save,
278 .load_state = slirp_state_load,
281 Slirp *slirp_init(int restricted, bool in_enabled, struct in_addr vnetwork,
282 struct in_addr vnetmask, struct in_addr vhost,
284 struct in6_addr vprefix_addr6, uint8_t vprefix_len,
285 struct in6_addr vhost6, const char *vhostname,
286 const char *tftp_server_name,
287 const char *tftp_path, const char *bootfile,
288 struct in_addr vdhcp_start, struct in_addr vnameserver,
289 struct in6_addr vnameserver6, const char **vdnssearch,
290 const char *vdomainname, void *opaque)
292 Slirp *slirp = g_malloc0(sizeof(Slirp));
296 slirp->grand = g_rand_new();
297 slirp->restricted = restricted;
299 slirp->in_enabled = in_enabled;
300 slirp->in6_enabled = in6_enabled;
306 /* Initialise mbufs *after* setting the MTU */
309 slirp->vnetwork_addr = vnetwork;
310 slirp->vnetwork_mask = vnetmask;
311 slirp->vhost_addr = vhost;
312 slirp->vprefix_addr6 = vprefix_addr6;
313 slirp->vprefix_len = vprefix_len;
314 slirp->vhost_addr6 = vhost6;
316 pstrcpy(slirp->client_hostname, sizeof(slirp->client_hostname),
319 slirp->tftp_prefix = g_strdup(tftp_path);
320 slirp->bootp_filename = g_strdup(bootfile);
321 slirp->vdomainname = g_strdup(vdomainname);
322 slirp->vdhcp_startaddr = vdhcp_start;
323 slirp->vnameserver_addr = vnameserver;
324 slirp->vnameserver_addr6 = vnameserver6;
325 slirp->tftp_server_name = g_strdup(tftp_server_name);
328 translate_dnssearch(slirp, vdnssearch);
331 slirp->opaque = opaque;
333 register_savevm_live(NULL, "slirp", 0, 4, &savevm_slirp_state, slirp);
335 QTAILQ_INSERT_TAIL(&slirp_instances, slirp, entry);
340 void slirp_cleanup(Slirp *slirp)
342 QTAILQ_REMOVE(&slirp_instances, slirp, entry);
344 unregister_savevm(NULL, "slirp", slirp);
350 g_rand_free(slirp->grand);
352 g_free(slirp->vdnssearch);
353 g_free(slirp->tftp_prefix);
354 g_free(slirp->bootp_filename);
355 g_free(slirp->vdomainname);
359 #define CONN_CANFSEND(so) (((so)->so_state & (SS_FCANTSENDMORE|SS_ISFCONNECTED)) == SS_ISFCONNECTED)
360 #define CONN_CANFRCV(so) (((so)->so_state & (SS_FCANTRCVMORE|SS_ISFCONNECTED)) == SS_ISFCONNECTED)
362 static void slirp_update_timeout(uint32_t *timeout)
367 if (*timeout <= TIMEOUT_FAST) {
371 t = MIN(1000, *timeout);
373 /* If we have tcp timeout with slirp, then we will fill @timeout with
374 * more precise value.
376 QTAILQ_FOREACH(slirp, &slirp_instances, entry) {
377 if (slirp->time_fasttimo) {
378 *timeout = TIMEOUT_FAST;
381 if (slirp->do_slowtimo) {
382 t = MIN(TIMEOUT_SLOW, t);
388 void slirp_pollfds_fill(GArray *pollfds, uint32_t *timeout)
391 struct socket *so, *so_next;
393 if (QTAILQ_EMPTY(&slirp_instances)) {
401 QTAILQ_FOREACH(slirp, &slirp_instances, entry) {
403 * *_slowtimo needs calling if there are IP fragments
404 * in the fragment queue, or there are TCP connections active
406 slirp->do_slowtimo = ((slirp->tcb.so_next != &slirp->tcb) ||
407 (&slirp->ipq.ip_link != slirp->ipq.ip_link.next));
409 for (so = slirp->tcb.so_next; so != &slirp->tcb;
413 so_next = so->so_next;
415 so->pollfds_idx = -1;
418 * See if we need a tcp_fasttimo
420 if (slirp->time_fasttimo == 0 &&
421 so->so_tcpcb->t_flags & TF_DELACK) {
422 slirp->time_fasttimo = curtime; /* Flag when want a fasttimo */
426 * NOFDREF can include still connecting to local-host,
427 * newly socreated() sockets etc. Don't want to select these.
429 if (so->so_state & SS_NOFDREF || so->s == -1) {
434 * Set for reading sockets which are accepting
436 if (so->so_state & SS_FACCEPTCONN) {
439 .events = G_IO_IN | G_IO_HUP | G_IO_ERR,
441 so->pollfds_idx = pollfds->len;
442 g_array_append_val(pollfds, pfd);
447 * Set for writing sockets which are connecting
449 if (so->so_state & SS_ISFCONNECTING) {
452 .events = G_IO_OUT | G_IO_ERR,
454 so->pollfds_idx = pollfds->len;
455 g_array_append_val(pollfds, pfd);
460 * Set for writing if we are connected, can send more, and
461 * we have something to send
463 if (CONN_CANFSEND(so) && so->so_rcv.sb_cc) {
464 events |= G_IO_OUT | G_IO_ERR;
468 * Set for reading (and urgent data) if we are connected, can
469 * receive more, and we have room for it XXX /2 ?
471 if (CONN_CANFRCV(so) &&
472 (so->so_snd.sb_cc < (so->so_snd.sb_datalen/2))) {
473 events |= G_IO_IN | G_IO_HUP | G_IO_ERR | G_IO_PRI;
481 so->pollfds_idx = pollfds->len;
482 g_array_append_val(pollfds, pfd);
489 for (so = slirp->udb.so_next; so != &slirp->udb;
491 so_next = so->so_next;
493 so->pollfds_idx = -1;
496 * See if it's timed out
499 if (so->so_expire <= curtime) {
503 slirp->do_slowtimo = true; /* Let socket expire */
508 * When UDP packets are received from over the
509 * link, they're sendto()'d straight away, so
510 * no need for setting for writing
511 * Limit the number of packets queued by this session
512 * to 4. Note that even though we try and limit this
513 * to 4 packets, the session could have more queued
514 * if the packets needed to be fragmented
517 if ((so->so_state & SS_ISFCONNECTED) && so->so_queued <= 4) {
520 .events = G_IO_IN | G_IO_HUP | G_IO_ERR,
522 so->pollfds_idx = pollfds->len;
523 g_array_append_val(pollfds, pfd);
530 for (so = slirp->icmp.so_next; so != &slirp->icmp;
532 so_next = so->so_next;
534 so->pollfds_idx = -1;
537 * See if it's timed out
540 if (so->so_expire <= curtime) {
544 slirp->do_slowtimo = true; /* Let socket expire */
548 if (so->so_state & SS_ISFCONNECTED) {
551 .events = G_IO_IN | G_IO_HUP | G_IO_ERR,
553 so->pollfds_idx = pollfds->len;
554 g_array_append_val(pollfds, pfd);
558 slirp_update_timeout(timeout);
561 void slirp_pollfds_poll(GArray *pollfds, int select_error)
564 struct socket *so, *so_next;
567 if (QTAILQ_EMPTY(&slirp_instances)) {
571 curtime = qemu_clock_get_ms(QEMU_CLOCK_REALTIME);
573 QTAILQ_FOREACH(slirp, &slirp_instances, entry) {
575 * See if anything has timed out
577 if (slirp->time_fasttimo &&
578 ((curtime - slirp->time_fasttimo) >= TIMEOUT_FAST)) {
580 slirp->time_fasttimo = 0;
582 if (slirp->do_slowtimo &&
583 ((curtime - slirp->last_slowtimo) >= TIMEOUT_SLOW)) {
586 slirp->last_slowtimo = curtime;
596 for (so = slirp->tcb.so_next; so != &slirp->tcb;
600 so_next = so->so_next;
603 if (so->pollfds_idx != -1) {
604 revents = g_array_index(pollfds, GPollFD,
605 so->pollfds_idx).revents;
608 if (so->so_state & SS_NOFDREF || so->s == -1) {
614 * This will soread as well, so no need to
615 * test for G_IO_IN below if this succeeds
617 if (revents & G_IO_PRI) {
620 /* Socket error might have resulted in the socket being
621 * removed, do not try to do anything more with it. */
626 * Check sockets for reading
628 else if (revents & (G_IO_IN | G_IO_HUP | G_IO_ERR)) {
630 * Check for incoming connections
632 if (so->so_state & SS_FACCEPTCONN) {
638 /* Output it if we read something */
640 tcp_output(sototcpcb(so));
643 /* Socket error might have resulted in the socket being
644 * removed, do not try to do anything more with it. */
650 * Check sockets for writing
652 if (!(so->so_state & SS_NOFDREF) &&
653 (revents & (G_IO_OUT | G_IO_ERR))) {
655 * Check for non-blocking, still-connecting sockets
657 if (so->so_state & SS_ISFCONNECTING) {
659 so->so_state &= ~SS_ISFCONNECTING;
661 ret = send(so->s, (const void *) &ret, 0, 0);
663 /* XXXXX Must fix, zero bytes is a NOP */
664 if (errno == EAGAIN || errno == EWOULDBLOCK ||
665 errno == EINPROGRESS || errno == ENOTCONN) {
670 so->so_state &= SS_PERSISTENT_MASK;
671 so->so_state |= SS_NOFDREF;
673 /* else so->so_state &= ~SS_ISFCONNECTING; */
678 tcp_input((struct mbuf *)NULL, sizeof(struct ip), so,
684 /* Call tcp_output in case we need to send a window
685 * update to the guest, otherwise it will be stuck
686 * until it sends a window probe. */
687 tcp_output(sototcpcb(so));
693 * Probe a still-connecting, non-blocking socket
694 * to check if it's still alive
697 if (so->so_state & SS_ISFCONNECTING) {
698 ret = qemu_recv(so->s, &ret, 0, 0);
702 if (errno == EAGAIN || errno == EWOULDBLOCK ||
703 errno == EINPROGRESS || errno == ENOTCONN) {
704 continue; /* Still connecting, continue */
708 so->so_state &= SS_PERSISTENT_MASK;
709 so->so_state |= SS_NOFDREF;
711 /* tcp_input will take care of it */
713 ret = send(so->s, &ret, 0, 0);
716 if (errno == EAGAIN || errno == EWOULDBLOCK ||
717 errno == EINPROGRESS || errno == ENOTCONN) {
721 so->so_state &= SS_PERSISTENT_MASK;
722 so->so_state |= SS_NOFDREF;
724 so->so_state &= ~SS_ISFCONNECTING;
728 tcp_input((struct mbuf *)NULL, sizeof(struct ip), so,
730 } /* SS_ISFCONNECTING */
736 * Incoming packets are sent straight away, they're not buffered.
737 * Incoming UDP data isn't buffered either.
739 for (so = slirp->udb.so_next; so != &slirp->udb;
743 so_next = so->so_next;
746 if (so->pollfds_idx != -1) {
747 revents = g_array_index(pollfds, GPollFD,
748 so->pollfds_idx).revents;
752 (revents & (G_IO_IN | G_IO_HUP | G_IO_ERR))) {
758 * Check incoming ICMP relies.
760 for (so = slirp->icmp.so_next; so != &slirp->icmp;
764 so_next = so->so_next;
767 if (so->pollfds_idx != -1) {
768 revents = g_array_index(pollfds, GPollFD,
769 so->pollfds_idx).revents;
773 (revents & (G_IO_IN | G_IO_HUP | G_IO_ERR))) {
783 static void arp_input(Slirp *slirp, const uint8_t *pkt, int pkt_len)
785 struct slirp_arphdr *ah = (struct slirp_arphdr *)(pkt + ETH_HLEN);
786 uint8_t arp_reply[MAX(ETH_HLEN + sizeof(struct slirp_arphdr), 64)];
787 struct ethhdr *reh = (struct ethhdr *)arp_reply;
788 struct slirp_arphdr *rah = (struct slirp_arphdr *)(arp_reply + ETH_HLEN);
790 struct ex_list *ex_ptr;
792 if (!slirp->in_enabled) {
796 ar_op = ntohs(ah->ar_op);
799 if (ah->ar_tip == ah->ar_sip) {
801 arp_table_add(slirp, ah->ar_sip, ah->ar_sha);
805 if ((ah->ar_tip & slirp->vnetwork_mask.s_addr) ==
806 slirp->vnetwork_addr.s_addr) {
807 if (ah->ar_tip == slirp->vnameserver_addr.s_addr ||
808 ah->ar_tip == slirp->vhost_addr.s_addr)
810 for (ex_ptr = slirp->exec_list; ex_ptr; ex_ptr = ex_ptr->ex_next) {
811 if (ex_ptr->ex_addr.s_addr == ah->ar_tip)
816 memset(arp_reply, 0, sizeof(arp_reply));
818 arp_table_add(slirp, ah->ar_sip, ah->ar_sha);
820 /* ARP request for alias/dns mac address */
821 memcpy(reh->h_dest, pkt + ETH_ALEN, ETH_ALEN);
822 memcpy(reh->h_source, special_ethaddr, ETH_ALEN - 4);
823 memcpy(&reh->h_source[2], &ah->ar_tip, 4);
824 reh->h_proto = htons(ETH_P_ARP);
826 rah->ar_hrd = htons(1);
827 rah->ar_pro = htons(ETH_P_IP);
828 rah->ar_hln = ETH_ALEN;
830 rah->ar_op = htons(ARPOP_REPLY);
831 memcpy(rah->ar_sha, reh->h_source, ETH_ALEN);
832 rah->ar_sip = ah->ar_tip;
833 memcpy(rah->ar_tha, ah->ar_sha, ETH_ALEN);
834 rah->ar_tip = ah->ar_sip;
835 slirp_output(slirp->opaque, arp_reply, sizeof(arp_reply));
839 arp_table_add(slirp, ah->ar_sip, ah->ar_sha);
846 void slirp_input(Slirp *slirp, const uint8_t *pkt, int pkt_len)
851 if (pkt_len < ETH_HLEN)
854 proto = ntohs(*(uint16_t *)(pkt + 12));
857 arp_input(slirp, pkt, pkt_len);
864 /* Note: we add 2 to align the IP header on 4 bytes,
865 * and add the margin for the tcpiphdr overhead */
866 if (M_FREEROOM(m) < pkt_len + TCPIPHDR_DELTA + 2) {
867 m_inc(m, pkt_len + TCPIPHDR_DELTA + 2);
869 m->m_len = pkt_len + TCPIPHDR_DELTA + 2;
870 memcpy(m->m_data + TCPIPHDR_DELTA + 2, pkt, pkt_len);
872 m->m_data += TCPIPHDR_DELTA + 2 + ETH_HLEN;
873 m->m_len -= TCPIPHDR_DELTA + 2 + ETH_HLEN;
875 if (proto == ETH_P_IP) {
877 } else if (proto == ETH_P_IPV6) {
883 ncsi_input(slirp, pkt, pkt_len);
891 /* Prepare the IPv4 packet to be sent to the ethernet device. Returns 1 if no
892 * packet should be sent, 0 if the packet must be re-queued, 2 if the packet
895 static int if_encap4(Slirp *slirp, struct mbuf *ifm, struct ethhdr *eh,
896 uint8_t ethaddr[ETH_ALEN])
898 const struct ip *iph = (const struct ip *)ifm->m_data;
900 if (iph->ip_dst.s_addr == 0) {
901 /* 0.0.0.0 can not be a destination address, something went wrong,
902 * avoid making it worse */
905 if (!arp_table_search(slirp, iph->ip_dst.s_addr, ethaddr)) {
906 uint8_t arp_req[ETH_HLEN + sizeof(struct slirp_arphdr)];
907 struct ethhdr *reh = (struct ethhdr *)arp_req;
908 struct slirp_arphdr *rah = (struct slirp_arphdr *)(arp_req + ETH_HLEN);
910 if (!ifm->resolution_requested) {
911 /* If the client addr is not known, send an ARP request */
912 memset(reh->h_dest, 0xff, ETH_ALEN);
913 memcpy(reh->h_source, special_ethaddr, ETH_ALEN - 4);
914 memcpy(&reh->h_source[2], &slirp->vhost_addr, 4);
915 reh->h_proto = htons(ETH_P_ARP);
916 rah->ar_hrd = htons(1);
917 rah->ar_pro = htons(ETH_P_IP);
918 rah->ar_hln = ETH_ALEN;
920 rah->ar_op = htons(ARPOP_REQUEST);
923 memcpy(rah->ar_sha, special_ethaddr, ETH_ALEN - 4);
924 memcpy(&rah->ar_sha[2], &slirp->vhost_addr, 4);
927 rah->ar_sip = slirp->vhost_addr.s_addr;
929 /* target hw addr (none) */
930 memset(rah->ar_tha, 0, ETH_ALEN);
933 rah->ar_tip = iph->ip_dst.s_addr;
934 slirp->client_ipaddr = iph->ip_dst;
935 slirp_output(slirp->opaque, arp_req, sizeof(arp_req));
936 ifm->resolution_requested = true;
938 /* Expire request and drop outgoing packet after 1 second */
939 ifm->expiration_date = qemu_clock_get_ns(QEMU_CLOCK_REALTIME) + 1000000000ULL;
943 memcpy(eh->h_source, special_ethaddr, ETH_ALEN - 4);
944 /* XXX: not correct */
945 memcpy(&eh->h_source[2], &slirp->vhost_addr, 4);
946 eh->h_proto = htons(ETH_P_IP);
953 /* Prepare the IPv6 packet to be sent to the ethernet device. Returns 1 if no
954 * packet should be sent, 0 if the packet must be re-queued, 2 if the packet
957 static int if_encap6(Slirp *slirp, struct mbuf *ifm, struct ethhdr *eh,
958 uint8_t ethaddr[ETH_ALEN])
960 const struct ip6 *ip6h = mtod(ifm, const struct ip6 *);
961 if (!ndp_table_search(slirp, ip6h->ip_dst, ethaddr)) {
962 if (!ifm->resolution_requested) {
963 ndp_send_ns(slirp, ip6h->ip_dst);
964 ifm->resolution_requested = true;
965 ifm->expiration_date =
966 qemu_clock_get_ns(QEMU_CLOCK_REALTIME) + 1000000000ULL;
970 eh->h_proto = htons(ETH_P_IPV6);
971 in6_compute_ethaddr(ip6h->ip_src, eh->h_source);
978 /* Output the IP packet to the ethernet device. Returns 0 if the packet must be
981 int if_encap(Slirp *slirp, struct mbuf *ifm)
984 struct ethhdr *eh = (struct ethhdr *)buf;
985 uint8_t ethaddr[ETH_ALEN];
986 const struct ip *iph = (const struct ip *)ifm->m_data;
989 if (ifm->m_len + ETH_HLEN > sizeof(buf)) {
995 ret = if_encap4(slirp, ifm, eh, ethaddr);
1002 ret = if_encap6(slirp, ifm, eh, ethaddr);
1009 g_assert_not_reached();
1013 memcpy(eh->h_dest, ethaddr, ETH_ALEN);
1014 DEBUG_ARGS((dfd, " src = %02x:%02x:%02x:%02x:%02x:%02x\n",
1015 eh->h_source[0], eh->h_source[1], eh->h_source[2],
1016 eh->h_source[3], eh->h_source[4], eh->h_source[5]));
1017 DEBUG_ARGS((dfd, " dst = %02x:%02x:%02x:%02x:%02x:%02x\n",
1018 eh->h_dest[0], eh->h_dest[1], eh->h_dest[2],
1019 eh->h_dest[3], eh->h_dest[4], eh->h_dest[5]));
1020 memcpy(buf + sizeof(struct ethhdr), ifm->m_data, ifm->m_len);
1021 slirp_output(slirp->opaque, buf, ifm->m_len + ETH_HLEN);
1025 /* Drop host forwarding rule, return 0 if found. */
1026 int slirp_remove_hostfwd(Slirp *slirp, int is_udp, struct in_addr host_addr,
1030 struct socket *head = (is_udp ? &slirp->udb : &slirp->tcb);
1031 struct sockaddr_in addr;
1032 int port = htons(host_port);
1035 for (so = head->so_next; so != head; so = so->so_next) {
1036 addr_len = sizeof(addr);
1037 if ((so->so_state & SS_HOSTFWD) &&
1038 getsockname(so->s, (struct sockaddr *)&addr, &addr_len) == 0 &&
1039 addr.sin_addr.s_addr == host_addr.s_addr &&
1040 addr.sin_port == port) {
1050 int slirp_add_hostfwd(Slirp *slirp, int is_udp, struct in_addr host_addr,
1051 int host_port, struct in_addr guest_addr, int guest_port)
1053 if (!guest_addr.s_addr) {
1054 guest_addr = slirp->vdhcp_startaddr;
1057 if (!udp_listen(slirp, host_addr.s_addr, htons(host_port),
1058 guest_addr.s_addr, htons(guest_port), SS_HOSTFWD))
1061 if (!tcp_listen(slirp, host_addr.s_addr, htons(host_port),
1062 guest_addr.s_addr, htons(guest_port), SS_HOSTFWD))
1068 int slirp_add_exec(Slirp *slirp, int do_pty, const void *args,
1069 struct in_addr *guest_addr, int guest_port)
1071 if (!guest_addr->s_addr) {
1072 guest_addr->s_addr = slirp->vnetwork_addr.s_addr |
1073 (htonl(0x0204) & ~slirp->vnetwork_mask.s_addr);
1075 if ((guest_addr->s_addr & slirp->vnetwork_mask.s_addr) !=
1076 slirp->vnetwork_addr.s_addr ||
1077 guest_addr->s_addr == slirp->vhost_addr.s_addr ||
1078 guest_addr->s_addr == slirp->vnameserver_addr.s_addr) {
1081 return add_exec(&slirp->exec_list, do_pty, (char *)args, *guest_addr,
1085 ssize_t slirp_send(struct socket *so, const void *buf, size_t len, int flags)
1087 if (so->s == -1 && so->extra) {
1088 /* XXX this blocks entire thread. Rewrite to use
1089 * qemu_chr_fe_write and background I/O callbacks */
1090 qemu_chr_fe_write_all(so->extra, buf, len);
1096 * This should in theory not happen but it is hard to be
1097 * sure because some code paths will end up with so->s == -1
1098 * on a failure but don't dispose of the struct socket.
1099 * Check specifically, so we don't pass -1 to send().
1105 return send(so->s, buf, len, flags);
1108 static struct socket *
1109 slirp_find_ctl_socket(Slirp *slirp, struct in_addr guest_addr, int guest_port)
1113 for (so = slirp->tcb.so_next; so != &slirp->tcb; so = so->so_next) {
1114 if (so->so_faddr.s_addr == guest_addr.s_addr &&
1115 htons(so->so_fport) == guest_port) {
1122 size_t slirp_socket_can_recv(Slirp *slirp, struct in_addr guest_addr,
1125 struct iovec iov[2];
1128 so = slirp_find_ctl_socket(slirp, guest_addr, guest_port);
1130 if (!so || so->so_state & SS_NOFDREF) {
1134 if (!CONN_CANFRCV(so) || so->so_snd.sb_cc >= (so->so_snd.sb_datalen/2)) {
1138 return sopreprbuf(so, iov, NULL);
1141 void slirp_socket_recv(Slirp *slirp, struct in_addr guest_addr, int guest_port,
1142 const uint8_t *buf, int size)
1145 struct socket *so = slirp_find_ctl_socket(slirp, guest_addr, guest_port);
1150 ret = soreadbuf(so, (const char *)buf, size);
1153 tcp_output(sototcpcb(so));
1156 static int slirp_tcp_post_load(void *opaque, int version)
1158 tcp_template((struct tcpcb *)opaque);
1163 static const VMStateDescription vmstate_slirp_tcp = {
1164 .name = "slirp-tcp",
1166 .post_load = slirp_tcp_post_load,
1167 .fields = (VMStateField[]) {
1168 VMSTATE_INT16(t_state, struct tcpcb),
1169 VMSTATE_INT16_ARRAY(t_timer, struct tcpcb, TCPT_NTIMERS),
1170 VMSTATE_INT16(t_rxtshift, struct tcpcb),
1171 VMSTATE_INT16(t_rxtcur, struct tcpcb),
1172 VMSTATE_INT16(t_dupacks, struct tcpcb),
1173 VMSTATE_UINT16(t_maxseg, struct tcpcb),
1174 VMSTATE_UINT8(t_force, struct tcpcb),
1175 VMSTATE_UINT16(t_flags, struct tcpcb),
1176 VMSTATE_UINT32(snd_una, struct tcpcb),
1177 VMSTATE_UINT32(snd_nxt, struct tcpcb),
1178 VMSTATE_UINT32(snd_up, struct tcpcb),
1179 VMSTATE_UINT32(snd_wl1, struct tcpcb),
1180 VMSTATE_UINT32(snd_wl2, struct tcpcb),
1181 VMSTATE_UINT32(iss, struct tcpcb),
1182 VMSTATE_UINT32(snd_wnd, struct tcpcb),
1183 VMSTATE_UINT32(rcv_wnd, struct tcpcb),
1184 VMSTATE_UINT32(rcv_nxt, struct tcpcb),
1185 VMSTATE_UINT32(rcv_up, struct tcpcb),
1186 VMSTATE_UINT32(irs, struct tcpcb),
1187 VMSTATE_UINT32(rcv_adv, struct tcpcb),
1188 VMSTATE_UINT32(snd_max, struct tcpcb),
1189 VMSTATE_UINT32(snd_cwnd, struct tcpcb),
1190 VMSTATE_UINT32(snd_ssthresh, struct tcpcb),
1191 VMSTATE_INT16(t_idle, struct tcpcb),
1192 VMSTATE_INT16(t_rtt, struct tcpcb),
1193 VMSTATE_UINT32(t_rtseq, struct tcpcb),
1194 VMSTATE_INT16(t_srtt, struct tcpcb),
1195 VMSTATE_INT16(t_rttvar, struct tcpcb),
1196 VMSTATE_UINT16(t_rttmin, struct tcpcb),
1197 VMSTATE_UINT32(max_sndwnd, struct tcpcb),
1198 VMSTATE_UINT8(t_oobflags, struct tcpcb),
1199 VMSTATE_UINT8(t_iobc, struct tcpcb),
1200 VMSTATE_INT16(t_softerror, struct tcpcb),
1201 VMSTATE_UINT8(snd_scale, struct tcpcb),
1202 VMSTATE_UINT8(rcv_scale, struct tcpcb),
1203 VMSTATE_UINT8(request_r_scale, struct tcpcb),
1204 VMSTATE_UINT8(requested_s_scale, struct tcpcb),
1205 VMSTATE_UINT32(ts_recent, struct tcpcb),
1206 VMSTATE_UINT32(ts_recent_age, struct tcpcb),
1207 VMSTATE_UINT32(last_ack_sent, struct tcpcb),
1208 VMSTATE_END_OF_LIST()
1212 /* The sbuf has a pair of pointers that are migrated as offsets;
1213 * we calculate the offsets and restore the pointers using
1214 * pre_save/post_load on a tmp structure.
1217 struct sbuf *parent;
1218 uint32_t roff, woff;
1221 static int sbuf_tmp_pre_save(void *opaque)
1223 struct sbuf_tmp *tmp = opaque;
1224 tmp->woff = tmp->parent->sb_wptr - tmp->parent->sb_data;
1225 tmp->roff = tmp->parent->sb_rptr - tmp->parent->sb_data;
1230 static int sbuf_tmp_post_load(void *opaque, int version)
1232 struct sbuf_tmp *tmp = opaque;
1233 uint32_t requested_len = tmp->parent->sb_datalen;
1235 /* Allocate the buffer space used by the field after the tmp */
1236 sbreserve(tmp->parent, tmp->parent->sb_datalen);
1238 if (tmp->parent->sb_datalen != requested_len) {
1241 if (tmp->woff >= requested_len ||
1242 tmp->roff >= requested_len) {
1243 error_report("invalid sbuf offsets r/w=%u/%u len=%u",
1244 tmp->roff, tmp->woff, requested_len);
1248 tmp->parent->sb_wptr = tmp->parent->sb_data + tmp->woff;
1249 tmp->parent->sb_rptr = tmp->parent->sb_data + tmp->roff;
1255 static const VMStateDescription vmstate_slirp_sbuf_tmp = {
1256 .name = "slirp-sbuf-tmp",
1257 .post_load = sbuf_tmp_post_load,
1258 .pre_save = sbuf_tmp_pre_save,
1260 .fields = (VMStateField[]) {
1261 VMSTATE_UINT32(woff, struct sbuf_tmp),
1262 VMSTATE_UINT32(roff, struct sbuf_tmp),
1263 VMSTATE_END_OF_LIST()
1267 static const VMStateDescription vmstate_slirp_sbuf = {
1268 .name = "slirp-sbuf",
1270 .fields = (VMStateField[]) {
1271 VMSTATE_UINT32(sb_cc, struct sbuf),
1272 VMSTATE_UINT32(sb_datalen, struct sbuf),
1273 VMSTATE_WITH_TMP(struct sbuf, struct sbuf_tmp, vmstate_slirp_sbuf_tmp),
1274 VMSTATE_VBUFFER_UINT32(sb_data, struct sbuf, 0, NULL, sb_datalen),
1275 VMSTATE_END_OF_LIST()
1279 static bool slirp_older_than_v4(void *opaque, int version_id)
1281 return version_id < 4;
1284 static bool slirp_family_inet(void *opaque, int version_id)
1286 union slirp_sockaddr *ssa = (union slirp_sockaddr *)opaque;
1287 return ssa->ss.ss_family == AF_INET;
1290 static int slirp_socket_pre_load(void *opaque)
1292 struct socket *so = opaque;
1293 if (tcp_attach(so) < 0) {
1296 /* Older versions don't load these fields */
1297 so->so_ffamily = AF_INET;
1298 so->so_lfamily = AF_INET;
1303 #define VMSTATE_SIN4_ADDR(f, s, t) VMSTATE_UINT32_TEST(f, s, t)
1305 /* Win uses u_long rather than uint32_t - but it's still 32bits long */
1306 #define VMSTATE_SIN4_ADDR(f, s, t) VMSTATE_SINGLE_TEST(f, s, t, 0, \
1307 vmstate_info_uint32, u_long)
1310 /* The OS provided ss_family field isn't that portable; it's size
1311 * and type varies (16/8 bit, signed, unsigned)
1312 * and the values it contains aren't fully portable.
1314 typedef struct SS_FamilyTmpStruct {
1315 union slirp_sockaddr *parent;
1316 uint16_t portable_family;
1317 } SS_FamilyTmpStruct;
1319 #define SS_FAMILY_MIG_IPV4 2 /* Linux, BSD, Win... */
1320 #define SS_FAMILY_MIG_IPV6 10 /* Linux */
1321 #define SS_FAMILY_MIG_OTHER 0xffff
1323 static int ss_family_pre_save(void *opaque)
1325 SS_FamilyTmpStruct *tss = opaque;
1327 tss->portable_family = SS_FAMILY_MIG_OTHER;
1329 if (tss->parent->ss.ss_family == AF_INET) {
1330 tss->portable_family = SS_FAMILY_MIG_IPV4;
1331 } else if (tss->parent->ss.ss_family == AF_INET6) {
1332 tss->portable_family = SS_FAMILY_MIG_IPV6;
1338 static int ss_family_post_load(void *opaque, int version_id)
1340 SS_FamilyTmpStruct *tss = opaque;
1342 switch (tss->portable_family) {
1343 case SS_FAMILY_MIG_IPV4:
1344 tss->parent->ss.ss_family = AF_INET;
1346 case SS_FAMILY_MIG_IPV6:
1347 case 23: /* compatibility: AF_INET6 from mingw */
1348 case 28: /* compatibility: AF_INET6 from FreeBSD sys/socket.h */
1349 tss->parent->ss.ss_family = AF_INET6;
1352 error_report("invalid ss_family type %x", tss->portable_family);
1359 static const VMStateDescription vmstate_slirp_ss_family = {
1360 .name = "slirp-socket-addr/ss_family",
1361 .pre_save = ss_family_pre_save,
1362 .post_load = ss_family_post_load,
1363 .fields = (VMStateField[]) {
1364 VMSTATE_UINT16(portable_family, SS_FamilyTmpStruct),
1365 VMSTATE_END_OF_LIST()
1369 static const VMStateDescription vmstate_slirp_socket_addr = {
1370 .name = "slirp-socket-addr",
1372 .fields = (VMStateField[]) {
1373 VMSTATE_WITH_TMP(union slirp_sockaddr, SS_FamilyTmpStruct,
1374 vmstate_slirp_ss_family),
1375 VMSTATE_SIN4_ADDR(sin.sin_addr.s_addr, union slirp_sockaddr,
1377 VMSTATE_UINT16_TEST(sin.sin_port, union slirp_sockaddr,
1381 /* Untested: Needs checking by someone with IPv6 test */
1382 VMSTATE_BUFFER_TEST(sin6.sin6_addr, union slirp_sockaddr,
1383 slirp_family_inet6),
1384 VMSTATE_UINT16_TEST(sin6.sin6_port, union slirp_sockaddr,
1385 slirp_family_inet6),
1386 VMSTATE_UINT32_TEST(sin6.sin6_flowinfo, union slirp_sockaddr,
1387 slirp_family_inet6),
1388 VMSTATE_UINT32_TEST(sin6.sin6_scope_id, union slirp_sockaddr,
1389 slirp_family_inet6),
1392 VMSTATE_END_OF_LIST()
1396 static const VMStateDescription vmstate_slirp_socket = {
1397 .name = "slirp-socket",
1399 .pre_load = slirp_socket_pre_load,
1400 .fields = (VMStateField[]) {
1401 VMSTATE_UINT32(so_urgc, struct socket),
1402 /* Pre-v4 versions */
1403 VMSTATE_SIN4_ADDR(so_faddr.s_addr, struct socket,
1404 slirp_older_than_v4),
1405 VMSTATE_SIN4_ADDR(so_laddr.s_addr, struct socket,
1406 slirp_older_than_v4),
1407 VMSTATE_UINT16_TEST(so_fport, struct socket, slirp_older_than_v4),
1408 VMSTATE_UINT16_TEST(so_lport, struct socket, slirp_older_than_v4),
1410 VMSTATE_STRUCT(fhost, struct socket, 4, vmstate_slirp_socket_addr,
1411 union slirp_sockaddr),
1412 VMSTATE_STRUCT(lhost, struct socket, 4, vmstate_slirp_socket_addr,
1413 union slirp_sockaddr),
1415 VMSTATE_UINT8(so_iptos, struct socket),
1416 VMSTATE_UINT8(so_emu, struct socket),
1417 VMSTATE_UINT8(so_type, struct socket),
1418 VMSTATE_INT32(so_state, struct socket),
1419 VMSTATE_STRUCT(so_rcv, struct socket, 0, vmstate_slirp_sbuf,
1421 VMSTATE_STRUCT(so_snd, struct socket, 0, vmstate_slirp_sbuf,
1423 VMSTATE_STRUCT_POINTER(so_tcpcb, struct socket, vmstate_slirp_tcp,
1425 VMSTATE_END_OF_LIST()
1429 static const VMStateDescription vmstate_slirp_bootp_client = {
1430 .name = "slirp_bootpclient",
1431 .fields = (VMStateField[]) {
1432 VMSTATE_UINT16(allocated, BOOTPClient),
1433 VMSTATE_BUFFER(macaddr, BOOTPClient),
1434 VMSTATE_END_OF_LIST()
1438 static const VMStateDescription vmstate_slirp = {
1441 .fields = (VMStateField[]) {
1442 VMSTATE_UINT16_V(ip_id, Slirp, 2),
1443 VMSTATE_STRUCT_ARRAY(bootp_clients, Slirp, NB_BOOTP_CLIENTS, 3,
1444 vmstate_slirp_bootp_client, BOOTPClient),
1445 VMSTATE_END_OF_LIST()
1449 static void slirp_state_save(QEMUFile *f, void *opaque)
1451 Slirp *slirp = opaque;
1452 struct ex_list *ex_ptr;
1454 for (ex_ptr = slirp->exec_list; ex_ptr; ex_ptr = ex_ptr->ex_next)
1455 if (ex_ptr->ex_pty == 3) {
1457 so = slirp_find_ctl_socket(slirp, ex_ptr->ex_addr,
1458 ntohs(ex_ptr->ex_fport));
1462 qemu_put_byte(f, 42);
1463 vmstate_save_state(f, &vmstate_slirp_socket, so, NULL);
1465 qemu_put_byte(f, 0);
1467 vmstate_save_state(f, &vmstate_slirp, slirp, NULL);
1471 static int slirp_state_load(QEMUFile *f, void *opaque, int version_id)
1473 Slirp *slirp = opaque;
1474 struct ex_list *ex_ptr;
1476 while (qemu_get_byte(f)) {
1478 struct socket *so = socreate(slirp);
1480 ret = vmstate_load_state(f, &vmstate_slirp_socket, so, version_id);
1485 if ((so->so_faddr.s_addr & slirp->vnetwork_mask.s_addr) !=
1486 slirp->vnetwork_addr.s_addr) {
1489 for (ex_ptr = slirp->exec_list; ex_ptr; ex_ptr = ex_ptr->ex_next) {
1490 if (ex_ptr->ex_pty == 3 &&
1491 so->so_faddr.s_addr == ex_ptr->ex_addr.s_addr &&
1492 so->so_fport == ex_ptr->ex_fport) {
1499 so->extra = (void *)ex_ptr->ex_exec;
1502 return vmstate_load_state(f, &vmstate_slirp, slirp, version_id);