lib/tsocket: add tdgram_bsd_existing_socket() helper function
[Samba.git] / lib / tsocket / tsocket_bsd.c
blob9ddbc061b94bf7db9ae999068f15edc406739857
/*
   Unix SMB/CIFS implementation.

   Copyright (C) Stefan Metzmacher 2009

     ** NOTE! The following LGPL license applies to the tsocket
     ** library. This does NOT imply that all of Samba is released
     ** under the LGPL

   This library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 3 of the License, or (at your option) any later version.

   This library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with this library; if not, see <http://www.gnu.org/licenses/>.
*/
24 #include "replace.h"
25 #include "system/filesys.h"
26 #include "system/network.h"
27 #include "tsocket.h"
28 #include "tsocket_internal.h"
29 #include "lib/util/iov_buf.h"
30 #include "lib/util/blocking.h"
/*
 * Turn the return value of a system call plus the errno observed after
 * it into a single error code.
 *
 * ret       - return value of the system call
 * sys_errno - errno value captured right after the call
 * retry     - set to true when the failure is one of the transient
 *             conditions listed below, false in every other case
 *
 * Returns 0 when ret is not negative, EIO when the failure cannot be
 * described (ret is negative but not -1, or sys_errno is 0), and
 * sys_errno otherwise.
 */
static int tsocket_bsd_error_from_errno(int ret,
					int sys_errno,
					bool *retry)
{
	bool transient;

	*retry = false;

	if (ret >= 0) {
		return 0;
	}

	if (ret != -1 || sys_errno == 0) {
		return EIO;
	}

	/* ENOMEM is retryable on Solaris/illumos, and possibly other systems. */
	transient = (sys_errno == EINTR) ||
		    (sys_errno == EINPROGRESS) ||
		    (sys_errno == EAGAIN) ||
		    (sys_errno == ENOMEM);
#ifdef EWOULDBLOCK
	transient = transient || (sys_errno == EWOULDBLOCK);
#endif

	*retry = transient;
	return sys_errno;
}
/*
 * Prepare a freshly created descriptor for use by this module.
 *
 * When high_fd is true the descriptor is first duplicated until its
 * number is at least 3; the lower numbered descriptors created or
 * passed in along the way are closed. Afterwards set_blocking(fd, false)
 * and smb_set_close_on_exec(fd) are applied.
 *
 * Returns the descriptor to use, or -1 with errno preserved from the
 * failing step. On failure the descriptor is closed. Passing -1
 * returns -1 without touching errno.
 */
static int tsocket_bsd_common_prepare_fd(int fd, bool high_fd)
{
	int low_fds[3];
	int num_low = 0;
	int saved_errno = 0;

	if (fd == -1) {
		return -1;
	}

	/* first make a fd >= 3 */
	if (high_fd) {
		int idx;

		while (fd < 3) {
			low_fds[num_low++] = fd;
			fd = dup(fd);
			if (fd == -1) {
				saved_errno = errno;
				break;
			}
		}

		/* the low descriptors are no longer needed, whatever happened */
		for (idx = 0; idx < num_low; idx++) {
			close(low_fds[idx]);
		}

		if (fd == -1) {
			errno = saved_errno;
			return fd;
		}
	}

	if (set_blocking(fd, false) == -1) {
		goto fail;
	}

	if (!smb_set_close_on_exec(fd)) {
		goto fail;
	}

	return fd;

fail:
	if (fd != -1) {
		/* close() must not hide the reason for the failure */
		saved_errno = errno;
		close(fd);
		errno = saved_errno;
	}
	return -1;
}
/*
 * Report how many bytes can be read from fd right now.
 *
 * Returns the FIONREAD value when it is non-zero. When it is zero the
 * pending socket error (SO_ERROR) is consulted: a non-zero socket error
 * is returned as -1 with errno set to it, otherwise 0 is returned.
 * Failures of ioctl()/getsockopt() are returned as -1 with their errno.
 */
static ssize_t tsocket_bsd_pending(int fd)
{
	int nbytes = 0;
	int so_error = 0;
	socklen_t so_error_len = sizeof(so_error);
	int rc;

	rc = ioctl(fd, FIONREAD, &nbytes);
	if (rc == -1) {
		return rc;
	}
	if (rc != 0) {
		/* this should not be reached */
		errno = EIO;
		return -1;
	}

	if (nbytes != 0) {
		return nbytes;
	}

	/*
	 * if no data is available check if the socket is in error state. For
	 * dgram sockets it's the way to return ICMP error messages of
	 * connected sockets to the caller.
	 */
	rc = getsockopt(fd, SOL_SOCKET, SO_ERROR, &so_error, &so_error_len);
	if (rc == -1) {
		return rc;
	}
	if (so_error != 0) {
		errno = so_error;
		return -1;
	}

	return 0;
}
175 static const struct tsocket_address_ops tsocket_address_bsd_ops;
177 struct tsocket_address_bsd {
178 socklen_t sa_socklen;
179 union {
180 struct sockaddr sa;
181 struct sockaddr_in in;
182 #ifdef HAVE_IPV6
183 struct sockaddr_in6 in6;
184 #endif
185 struct sockaddr_un un;
186 struct sockaddr_storage ss;
187 } u;
190 int _tsocket_address_bsd_from_sockaddr(TALLOC_CTX *mem_ctx,
191 const struct sockaddr *sa,
192 size_t sa_socklen,
193 struct tsocket_address **_addr,
194 const char *location)
196 struct tsocket_address *addr;
197 struct tsocket_address_bsd *bsda;
199 if (sa_socklen < sizeof(sa->sa_family)) {
200 errno = EINVAL;
201 return -1;
204 switch (sa->sa_family) {
205 case AF_UNIX:
206 if (sa_socklen > sizeof(struct sockaddr_un)) {
207 sa_socklen = sizeof(struct sockaddr_un);
209 break;
210 case AF_INET:
211 if (sa_socklen < sizeof(struct sockaddr_in)) {
212 errno = EINVAL;
213 return -1;
215 sa_socklen = sizeof(struct sockaddr_in);
216 break;
217 #ifdef HAVE_IPV6
218 case AF_INET6:
219 if (sa_socklen < sizeof(struct sockaddr_in6)) {
220 errno = EINVAL;
221 return -1;
223 sa_socklen = sizeof(struct sockaddr_in6);
224 break;
225 #endif
226 default:
227 errno = EAFNOSUPPORT;
228 return -1;
231 if (sa_socklen > sizeof(struct sockaddr_storage)) {
232 errno = EINVAL;
233 return -1;
236 addr = tsocket_address_create(mem_ctx,
237 &tsocket_address_bsd_ops,
238 &bsda,
239 struct tsocket_address_bsd,
240 location);
241 if (!addr) {
242 errno = ENOMEM;
243 return -1;
246 ZERO_STRUCTP(bsda);
248 memcpy(&bsda->u.ss, sa, sa_socklen);
250 bsda->sa_socklen = sa_socklen;
251 #ifdef HAVE_STRUCT_SOCKADDR_SA_LEN
252 bsda->u.sa.sa_len = bsda->sa_socklen;
253 #endif
255 *_addr = addr;
256 return 0;
259 ssize_t tsocket_address_bsd_sockaddr(const struct tsocket_address *addr,
260 struct sockaddr *sa,
261 size_t sa_socklen)
263 struct tsocket_address_bsd *bsda = talloc_get_type(addr->private_data,
264 struct tsocket_address_bsd);
266 if (!bsda) {
267 errno = EINVAL;
268 return -1;
271 if (sa_socklen < bsda->sa_socklen) {
272 errno = EINVAL;
273 return -1;
276 if (sa_socklen > bsda->sa_socklen) {
277 memset(sa, 0, sa_socklen);
278 sa_socklen = bsda->sa_socklen;
281 memcpy(sa, &bsda->u.ss, sa_socklen);
282 #ifdef HAVE_STRUCT_SOCKADDR_SA_LEN
283 sa->sa_len = sa_socklen;
284 #endif
285 return sa_socklen;
288 bool tsocket_address_is_inet(const struct tsocket_address *addr, const char *fam)
290 struct tsocket_address_bsd *bsda = talloc_get_type(addr->private_data,
291 struct tsocket_address_bsd);
293 if (!bsda) {
294 return false;
297 switch (bsda->u.sa.sa_family) {
298 case AF_INET:
299 if (strcasecmp(fam, "ip") == 0) {
300 return true;
303 if (strcasecmp(fam, "ipv4") == 0) {
304 return true;
307 return false;
308 #ifdef HAVE_IPV6
309 case AF_INET6:
310 if (strcasecmp(fam, "ip") == 0) {
311 return true;
314 if (strcasecmp(fam, "ipv6") == 0) {
315 return true;
318 return false;
319 #endif
322 return false;
325 int _tsocket_address_inet_from_strings(TALLOC_CTX *mem_ctx,
326 const char *fam,
327 const char *addr,
328 uint16_t port,
329 struct tsocket_address **_addr,
330 const char *location)
332 struct addrinfo hints;
333 struct addrinfo *result = NULL;
334 char port_str[6];
335 int ret;
337 ZERO_STRUCT(hints);
339 * we use SOCKET_STREAM here to get just one result
340 * back from getaddrinfo().
342 hints.ai_socktype = SOCK_STREAM;
343 hints.ai_flags = AI_NUMERICHOST | AI_NUMERICSERV;
345 if (strcasecmp(fam, "ip") == 0) {
346 hints.ai_family = AF_UNSPEC;
347 if (!addr) {
348 #ifdef HAVE_IPV6
349 addr = "::";
350 #else
351 addr = "0.0.0.0";
352 #endif
354 } else if (strcasecmp(fam, "ipv4") == 0) {
355 hints.ai_family = AF_INET;
356 if (!addr) {
357 addr = "0.0.0.0";
359 #ifdef HAVE_IPV6
360 } else if (strcasecmp(fam, "ipv6") == 0) {
361 hints.ai_family = AF_INET6;
362 if (!addr) {
363 addr = "::";
365 #endif
366 } else {
367 errno = EAFNOSUPPORT;
368 return -1;
371 snprintf(port_str, sizeof(port_str), "%u", port);
373 ret = getaddrinfo(addr, port_str, &hints, &result);
374 if (ret != 0) {
375 switch (ret) {
376 case EAI_FAIL:
377 errno = EINVAL;
378 break;
380 ret = -1;
381 goto done;
384 if (result->ai_socktype != SOCK_STREAM) {
385 errno = EINVAL;
386 ret = -1;
387 goto done;
390 ret = _tsocket_address_bsd_from_sockaddr(mem_ctx,
391 result->ai_addr,
392 result->ai_addrlen,
393 _addr,
394 location);
396 done:
397 if (result) {
398 freeaddrinfo(result);
400 return ret;
403 char *tsocket_address_inet_addr_string(const struct tsocket_address *addr,
404 TALLOC_CTX *mem_ctx)
406 struct tsocket_address_bsd *bsda = talloc_get_type(addr->private_data,
407 struct tsocket_address_bsd);
408 char addr_str[INET6_ADDRSTRLEN+1];
409 const char *str;
411 if (!bsda) {
412 errno = EINVAL;
413 return NULL;
416 switch (bsda->u.sa.sa_family) {
417 case AF_INET:
418 str = inet_ntop(bsda->u.in.sin_family,
419 &bsda->u.in.sin_addr,
420 addr_str, sizeof(addr_str));
421 break;
422 #ifdef HAVE_IPV6
423 case AF_INET6:
424 str = inet_ntop(bsda->u.in6.sin6_family,
425 &bsda->u.in6.sin6_addr,
426 addr_str, sizeof(addr_str));
427 break;
428 #endif
429 default:
430 errno = EINVAL;
431 return NULL;
434 if (!str) {
435 return NULL;
438 return talloc_strdup(mem_ctx, str);
441 uint16_t tsocket_address_inet_port(const struct tsocket_address *addr)
443 struct tsocket_address_bsd *bsda = talloc_get_type(addr->private_data,
444 struct tsocket_address_bsd);
445 uint16_t port = 0;
447 if (!bsda) {
448 errno = EINVAL;
449 return 0;
452 switch (bsda->u.sa.sa_family) {
453 case AF_INET:
454 port = ntohs(bsda->u.in.sin_port);
455 break;
456 #ifdef HAVE_IPV6
457 case AF_INET6:
458 port = ntohs(bsda->u.in6.sin6_port);
459 break;
460 #endif
461 default:
462 errno = EINVAL;
463 return 0;
466 return port;
469 int tsocket_address_inet_set_port(struct tsocket_address *addr,
470 uint16_t port)
472 struct tsocket_address_bsd *bsda = talloc_get_type(addr->private_data,
473 struct tsocket_address_bsd);
475 if (!bsda) {
476 errno = EINVAL;
477 return -1;
480 switch (bsda->u.sa.sa_family) {
481 case AF_INET:
482 bsda->u.in.sin_port = htons(port);
483 break;
484 #ifdef HAVE_IPV6
485 case AF_INET6:
486 bsda->u.in6.sin6_port = htons(port);
487 break;
488 #endif
489 default:
490 errno = EINVAL;
491 return -1;
494 return 0;
497 bool tsocket_address_is_unix(const struct tsocket_address *addr)
499 struct tsocket_address_bsd *bsda = talloc_get_type(addr->private_data,
500 struct tsocket_address_bsd);
502 if (!bsda) {
503 return false;
506 switch (bsda->u.sa.sa_family) {
507 case AF_UNIX:
508 return true;
511 return false;
514 int _tsocket_address_unix_from_path(TALLOC_CTX *mem_ctx,
515 const char *path,
516 struct tsocket_address **_addr,
517 const char *location)
519 struct sockaddr_un un;
520 void *p = &un;
521 int ret;
523 if (!path) {
524 path = "";
527 if (strlen(path) > sizeof(un.sun_path)-1) {
528 errno = ENAMETOOLONG;
529 return -1;
532 ZERO_STRUCT(un);
533 un.sun_family = AF_UNIX;
534 strncpy(un.sun_path, path, sizeof(un.sun_path)-1);
536 ret = _tsocket_address_bsd_from_sockaddr(mem_ctx,
537 (struct sockaddr *)p,
538 sizeof(un),
539 _addr,
540 location);
542 return ret;
545 char *tsocket_address_unix_path(const struct tsocket_address *addr,
546 TALLOC_CTX *mem_ctx)
548 struct tsocket_address_bsd *bsda = talloc_get_type(addr->private_data,
549 struct tsocket_address_bsd);
550 const char *str;
552 if (!bsda) {
553 errno = EINVAL;
554 return NULL;
557 switch (bsda->u.sa.sa_family) {
558 case AF_UNIX:
559 str = bsda->u.un.sun_path;
560 break;
561 default:
562 errno = EINVAL;
563 return NULL;
566 return talloc_strdup(mem_ctx, str);
569 static char *tsocket_address_bsd_string(const struct tsocket_address *addr,
570 TALLOC_CTX *mem_ctx)
572 struct tsocket_address_bsd *bsda = talloc_get_type(addr->private_data,
573 struct tsocket_address_bsd);
574 char *str;
575 char *addr_str;
576 const char *prefix = NULL;
577 uint16_t port;
579 switch (bsda->u.sa.sa_family) {
580 case AF_UNIX:
581 return talloc_asprintf(mem_ctx, "unix:%s",
582 bsda->u.un.sun_path);
583 case AF_INET:
584 prefix = "ipv4";
585 break;
586 #ifdef HAVE_IPV6
587 case AF_INET6:
588 prefix = "ipv6";
589 break;
590 #endif
591 default:
592 errno = EINVAL;
593 return NULL;
596 addr_str = tsocket_address_inet_addr_string(addr, mem_ctx);
597 if (!addr_str) {
598 return NULL;
601 port = tsocket_address_inet_port(addr);
603 str = talloc_asprintf(mem_ctx, "%s:%s:%u",
604 prefix, addr_str, port);
605 talloc_free(addr_str);
607 return str;
610 static struct tsocket_address *tsocket_address_bsd_copy(const struct tsocket_address *addr,
611 TALLOC_CTX *mem_ctx,
612 const char *location)
614 struct tsocket_address_bsd *bsda = talloc_get_type(addr->private_data,
615 struct tsocket_address_bsd);
616 struct tsocket_address *copy;
617 int ret;
619 ret = _tsocket_address_bsd_from_sockaddr(mem_ctx,
620 &bsda->u.sa,
621 bsda->sa_socklen,
622 &copy,
623 location);
624 if (ret != 0) {
625 return NULL;
628 return copy;
631 static const struct tsocket_address_ops tsocket_address_bsd_ops = {
632 .name = "bsd",
633 .string = tsocket_address_bsd_string,
634 .copy = tsocket_address_bsd_copy,
/*
 * Private data of a "bsd" datagram context.
 */
struct tdgram_bsd {
	/* the socket, -1 once it has been closed */
	int fd;

	/* the tevent context 'fde' was registered on, used for comparison */
	void *event_ptr;
	struct tevent_fd *fde;
	/* try recvfrom() right away instead of waiting for readability */
	bool optimize_recvfrom;

	/* callbacks dispatched by tdgram_bsd_fde_handler() */
	void *readable_private;
	void (*readable_handler)(void *private_data);
	void *writeable_private;
	void (*writeable_handler)(void *private_data);
};
650 bool tdgram_bsd_optimize_recvfrom(struct tdgram_context *dgram,
651 bool on)
653 struct tdgram_bsd *bsds =
654 talloc_get_type(_tdgram_context_data(dgram),
655 struct tdgram_bsd);
656 bool old;
658 if (bsds == NULL) {
659 /* not a bsd socket */
660 return false;
663 old = bsds->optimize_recvfrom;
664 bsds->optimize_recvfrom = on;
666 return old;
669 static void tdgram_bsd_fde_handler(struct tevent_context *ev,
670 struct tevent_fd *fde,
671 uint16_t flags,
672 void *private_data)
674 struct tdgram_bsd *bsds = talloc_get_type_abort(private_data,
675 struct tdgram_bsd);
677 if (flags & TEVENT_FD_WRITE) {
678 bsds->writeable_handler(bsds->writeable_private);
679 return;
681 if (flags & TEVENT_FD_READ) {
682 if (!bsds->readable_handler) {
683 TEVENT_FD_NOT_READABLE(bsds->fde);
684 return;
686 bsds->readable_handler(bsds->readable_private);
687 return;
691 static int tdgram_bsd_set_readable_handler(struct tdgram_bsd *bsds,
692 struct tevent_context *ev,
693 void (*handler)(void *private_data),
694 void *private_data)
696 if (ev == NULL) {
697 if (handler) {
698 errno = EINVAL;
699 return -1;
701 if (!bsds->readable_handler) {
702 return 0;
704 bsds->readable_handler = NULL;
705 bsds->readable_private = NULL;
707 return 0;
710 /* read and write must use the same tevent_context */
711 if (bsds->event_ptr != ev) {
712 if (bsds->readable_handler || bsds->writeable_handler) {
713 errno = EINVAL;
714 return -1;
716 bsds->event_ptr = NULL;
717 TALLOC_FREE(bsds->fde);
720 if (tevent_fd_get_flags(bsds->fde) == 0) {
721 TALLOC_FREE(bsds->fde);
723 bsds->fde = tevent_add_fd(ev, bsds,
724 bsds->fd, TEVENT_FD_READ,
725 tdgram_bsd_fde_handler,
726 bsds);
727 if (!bsds->fde) {
728 errno = ENOMEM;
729 return -1;
732 /* cache the event context we're running on */
733 bsds->event_ptr = ev;
734 } else if (!bsds->readable_handler) {
735 TEVENT_FD_READABLE(bsds->fde);
738 bsds->readable_handler = handler;
739 bsds->readable_private = private_data;
741 return 0;
744 static int tdgram_bsd_set_writeable_handler(struct tdgram_bsd *bsds,
745 struct tevent_context *ev,
746 void (*handler)(void *private_data),
747 void *private_data)
749 if (ev == NULL) {
750 if (handler) {
751 errno = EINVAL;
752 return -1;
754 if (!bsds->writeable_handler) {
755 return 0;
757 bsds->writeable_handler = NULL;
758 bsds->writeable_private = NULL;
759 TEVENT_FD_NOT_WRITEABLE(bsds->fde);
761 return 0;
764 /* read and write must use the same tevent_context */
765 if (bsds->event_ptr != ev) {
766 if (bsds->readable_handler || bsds->writeable_handler) {
767 errno = EINVAL;
768 return -1;
770 bsds->event_ptr = NULL;
771 TALLOC_FREE(bsds->fde);
774 if (tevent_fd_get_flags(bsds->fde) == 0) {
775 TALLOC_FREE(bsds->fde);
777 bsds->fde = tevent_add_fd(ev, bsds,
778 bsds->fd, TEVENT_FD_WRITE,
779 tdgram_bsd_fde_handler,
780 bsds);
781 if (!bsds->fde) {
782 errno = ENOMEM;
783 return -1;
786 /* cache the event context we're running on */
787 bsds->event_ptr = ev;
788 } else if (!bsds->writeable_handler) {
789 TEVENT_FD_WRITEABLE(bsds->fde);
792 bsds->writeable_handler = handler;
793 bsds->writeable_private = private_data;
795 return 0;
/* per request state of tdgram_bsd_recvfrom_send/recv */
struct tdgram_bsd_recvfrom_state {
	struct tdgram_context *dgram;
	/* true until the handler has run once */
	bool first_try;
	/* received payload and its length */
	uint8_t *buf;
	size_t len;
	/* sender of the datagram */
	struct tsocket_address *src;
};
806 static int tdgram_bsd_recvfrom_destructor(struct tdgram_bsd_recvfrom_state *state)
808 struct tdgram_bsd *bsds = tdgram_context_data(state->dgram,
809 struct tdgram_bsd);
811 tdgram_bsd_set_readable_handler(bsds, NULL, NULL, NULL);
813 return 0;
816 static void tdgram_bsd_recvfrom_handler(void *private_data);
818 static struct tevent_req *tdgram_bsd_recvfrom_send(TALLOC_CTX *mem_ctx,
819 struct tevent_context *ev,
820 struct tdgram_context *dgram)
822 struct tevent_req *req;
823 struct tdgram_bsd_recvfrom_state *state;
824 struct tdgram_bsd *bsds = tdgram_context_data(dgram, struct tdgram_bsd);
825 int ret;
827 req = tevent_req_create(mem_ctx, &state,
828 struct tdgram_bsd_recvfrom_state);
829 if (!req) {
830 return NULL;
833 state->dgram = dgram;
834 state->first_try= true;
835 state->buf = NULL;
836 state->len = 0;
837 state->src = NULL;
839 talloc_set_destructor(state, tdgram_bsd_recvfrom_destructor);
841 if (bsds->fd == -1) {
842 tevent_req_error(req, ENOTCONN);
843 goto post;
848 * this is a fast path, not waiting for the
849 * socket to become explicit readable gains
850 * about 10%-20% performance in benchmark tests.
852 if (bsds->optimize_recvfrom) {
854 * We only do the optimization on
855 * recvfrom if the caller asked for it.
857 * This is needed because in most cases
858 * we preferr to flush send buffers before
859 * receiving incoming requests.
861 tdgram_bsd_recvfrom_handler(req);
862 if (!tevent_req_is_in_progress(req)) {
863 goto post;
867 ret = tdgram_bsd_set_readable_handler(bsds, ev,
868 tdgram_bsd_recvfrom_handler,
869 req);
870 if (ret == -1) {
871 tevent_req_error(req, errno);
872 goto post;
875 return req;
877 post:
878 tevent_req_post(req, ev);
879 return req;
882 static void tdgram_bsd_recvfrom_handler(void *private_data)
884 struct tevent_req *req = talloc_get_type_abort(private_data,
885 struct tevent_req);
886 struct tdgram_bsd_recvfrom_state *state = tevent_req_data(req,
887 struct tdgram_bsd_recvfrom_state);
888 struct tdgram_context *dgram = state->dgram;
889 struct tdgram_bsd *bsds = tdgram_context_data(dgram, struct tdgram_bsd);
890 struct tsocket_address_bsd *bsda;
891 ssize_t ret;
892 int err;
893 bool retry;
895 ret = tsocket_bsd_pending(bsds->fd);
896 if (state->first_try && ret == 0) {
897 state->first_try = false;
898 /* retry later */
899 return;
901 state->first_try = false;
903 err = tsocket_bsd_error_from_errno(ret, errno, &retry);
904 if (retry) {
905 /* retry later */
906 return;
908 if (tevent_req_error(req, err)) {
909 return;
912 /* note that 'ret' can be 0 here */
913 state->buf = talloc_array(state, uint8_t, ret);
914 if (tevent_req_nomem(state->buf, req)) {
915 return;
917 state->len = ret;
919 state->src = tsocket_address_create(state,
920 &tsocket_address_bsd_ops,
921 &bsda,
922 struct tsocket_address_bsd,
923 __location__ "bsd_recvfrom");
924 if (tevent_req_nomem(state->src, req)) {
925 return;
928 ZERO_STRUCTP(bsda);
929 bsda->sa_socklen = sizeof(bsda->u.ss);
930 #ifdef HAVE_STRUCT_SOCKADDR_SA_LEN
931 bsda->u.sa.sa_len = bsda->sa_socklen;
932 #endif
934 ret = recvfrom(bsds->fd, state->buf, state->len, 0,
935 &bsda->u.sa, &bsda->sa_socklen);
936 err = tsocket_bsd_error_from_errno(ret, errno, &retry);
937 if (retry) {
938 /* retry later */
939 return;
941 if (tevent_req_error(req, err)) {
942 return;
946 * Some systems (FreeBSD, see bug #7115) return too much
947 * bytes in tsocket_bsd_pending()/ioctl(fd, FIONREAD, ...),
948 * the return value includes some IP/UDP header bytes,
949 * while recvfrom() just returns the payload.
951 state->buf = talloc_realloc(state, state->buf, uint8_t, ret);
952 if (tevent_req_nomem(state->buf, req)) {
953 return;
955 state->len = ret;
957 tevent_req_done(req);
960 static ssize_t tdgram_bsd_recvfrom_recv(struct tevent_req *req,
961 int *perrno,
962 TALLOC_CTX *mem_ctx,
963 uint8_t **buf,
964 struct tsocket_address **src)
966 struct tdgram_bsd_recvfrom_state *state = tevent_req_data(req,
967 struct tdgram_bsd_recvfrom_state);
968 ssize_t ret;
970 ret = tsocket_simple_int_recv(req, perrno);
971 if (ret == 0) {
972 *buf = talloc_move(mem_ctx, &state->buf);
973 ret = state->len;
974 if (src) {
975 *src = talloc_move(mem_ctx, &state->src);
979 tevent_req_received(req);
980 return ret;
/* per request state of tdgram_bsd_sendto_send/recv */
struct tdgram_bsd_sendto_state {
	struct tdgram_context *dgram;

	/* payload to send; the pointer is stored, the data is not copied */
	const uint8_t *buf;
	size_t len;
	/* destination, may be NULL */
	const struct tsocket_address *dst;

	/* result of sendto(), -1 until the datagram was sent */
	ssize_t ret;
};
993 static int tdgram_bsd_sendto_destructor(struct tdgram_bsd_sendto_state *state)
995 struct tdgram_bsd *bsds = tdgram_context_data(state->dgram,
996 struct tdgram_bsd);
998 tdgram_bsd_set_writeable_handler(bsds, NULL, NULL, NULL);
1000 return 0;
1003 static void tdgram_bsd_sendto_handler(void *private_data);
1005 static struct tevent_req *tdgram_bsd_sendto_send(TALLOC_CTX *mem_ctx,
1006 struct tevent_context *ev,
1007 struct tdgram_context *dgram,
1008 const uint8_t *buf,
1009 size_t len,
1010 const struct tsocket_address *dst)
1012 struct tevent_req *req;
1013 struct tdgram_bsd_sendto_state *state;
1014 struct tdgram_bsd *bsds = tdgram_context_data(dgram, struct tdgram_bsd);
1015 int ret;
1017 req = tevent_req_create(mem_ctx, &state,
1018 struct tdgram_bsd_sendto_state);
1019 if (!req) {
1020 return NULL;
1023 state->dgram = dgram;
1024 state->buf = buf;
1025 state->len = len;
1026 state->dst = dst;
1027 state->ret = -1;
1029 talloc_set_destructor(state, tdgram_bsd_sendto_destructor);
1031 if (bsds->fd == -1) {
1032 tevent_req_error(req, ENOTCONN);
1033 goto post;
1037 * this is a fast path, not waiting for the
1038 * socket to become explicit writeable gains
1039 * about 10%-20% performance in benchmark tests.
1041 tdgram_bsd_sendto_handler(req);
1042 if (!tevent_req_is_in_progress(req)) {
1043 goto post;
1046 ret = tdgram_bsd_set_writeable_handler(bsds, ev,
1047 tdgram_bsd_sendto_handler,
1048 req);
1049 if (ret == -1) {
1050 tevent_req_error(req, errno);
1051 goto post;
1054 return req;
1056 post:
1057 tevent_req_post(req, ev);
1058 return req;
1061 static void tdgram_bsd_sendto_handler(void *private_data)
1063 struct tevent_req *req = talloc_get_type_abort(private_data,
1064 struct tevent_req);
1065 struct tdgram_bsd_sendto_state *state = tevent_req_data(req,
1066 struct tdgram_bsd_sendto_state);
1067 struct tdgram_context *dgram = state->dgram;
1068 struct tdgram_bsd *bsds = tdgram_context_data(dgram, struct tdgram_bsd);
1069 struct sockaddr *sa = NULL;
1070 socklen_t sa_socklen = 0;
1071 ssize_t ret;
1072 int err;
1073 bool retry;
1075 if (state->dst) {
1076 struct tsocket_address_bsd *bsda =
1077 talloc_get_type(state->dst->private_data,
1078 struct tsocket_address_bsd);
1080 sa = &bsda->u.sa;
1081 sa_socklen = bsda->sa_socklen;
1084 ret = sendto(bsds->fd, state->buf, state->len, 0, sa, sa_socklen);
1085 err = tsocket_bsd_error_from_errno(ret, errno, &retry);
1086 if (retry) {
1087 /* retry later */
1088 return;
1091 if (err == EMSGSIZE) {
1092 /* round up in 1K increments */
1093 int bufsize = ((state->len + 1023) & (~1023));
1095 ret = setsockopt(bsds->fd, SOL_SOCKET, SO_SNDBUF, &bufsize,
1096 sizeof(bufsize));
1097 if (ret == 0) {
1099 * We do the retry here, rather then via the
1100 * handler, as we only want to retry once for
1101 * this condition, so if there is a mismatch
1102 * between what setsockopt() accepts and what can
1103 * actually be sent, we do not end up in a
1104 * loop.
1107 ret = sendto(bsds->fd, state->buf, state->len,
1108 0, sa, sa_socklen);
1109 err = tsocket_bsd_error_from_errno(ret, errno, &retry);
1110 if (retry) { /* retry later */
1111 return;
1116 if (tevent_req_error(req, err)) {
1117 return;
1120 state->ret = ret;
1122 tevent_req_done(req);
1125 static ssize_t tdgram_bsd_sendto_recv(struct tevent_req *req, int *perrno)
1127 struct tdgram_bsd_sendto_state *state = tevent_req_data(req,
1128 struct tdgram_bsd_sendto_state);
1129 ssize_t ret;
1131 ret = tsocket_simple_int_recv(req, perrno);
1132 if (ret == 0) {
1133 ret = state->ret;
1136 tevent_req_received(req);
1137 return ret;
/* the disconnect request carries no data; a placeholder member only */
struct tdgram_bsd_disconnect_state {
	uint8_t __dummy;
};
1144 static struct tevent_req *tdgram_bsd_disconnect_send(TALLOC_CTX *mem_ctx,
1145 struct tevent_context *ev,
1146 struct tdgram_context *dgram)
1148 struct tdgram_bsd *bsds = tdgram_context_data(dgram, struct tdgram_bsd);
1149 struct tevent_req *req;
1150 struct tdgram_bsd_disconnect_state *state;
1151 int ret;
1152 int err;
1153 bool dummy;
1155 req = tevent_req_create(mem_ctx, &state,
1156 struct tdgram_bsd_disconnect_state);
1157 if (req == NULL) {
1158 return NULL;
1161 if (bsds->fd == -1) {
1162 tevent_req_error(req, ENOTCONN);
1163 goto post;
1166 TALLOC_FREE(bsds->fde);
1167 ret = close(bsds->fd);
1168 bsds->fd = -1;
1169 err = tsocket_bsd_error_from_errno(ret, errno, &dummy);
1170 if (tevent_req_error(req, err)) {
1171 goto post;
1174 tevent_req_done(req);
1175 post:
1176 tevent_req_post(req, ev);
1177 return req;
/*
 * Collect the result of a disconnect request, as reported by
 * tsocket_simple_int_recv().
 */
static int tdgram_bsd_disconnect_recv(struct tevent_req *req,
				      int *perrno)
{
	int result = tsocket_simple_int_recv(req, perrno);

	tevent_req_received(req);
	return result;
}
1191 static const struct tdgram_context_ops tdgram_bsd_ops = {
1192 .name = "bsd",
1194 .recvfrom_send = tdgram_bsd_recvfrom_send,
1195 .recvfrom_recv = tdgram_bsd_recvfrom_recv,
1197 .sendto_send = tdgram_bsd_sendto_send,
1198 .sendto_recv = tdgram_bsd_sendto_recv,
1200 .disconnect_send = tdgram_bsd_disconnect_send,
1201 .disconnect_recv = tdgram_bsd_disconnect_recv,
1204 static int tdgram_bsd_destructor(struct tdgram_bsd *bsds)
1206 TALLOC_FREE(bsds->fde);
1207 if (bsds->fd != -1) {
1208 close(bsds->fd);
1209 bsds->fd = -1;
1211 return 0;
1214 static int tdgram_bsd_dgram_socket(const struct tsocket_address *local,
1215 const struct tsocket_address *remote,
1216 bool broadcast,
1217 TALLOC_CTX *mem_ctx,
1218 struct tdgram_context **_dgram,
1219 const char *location)
1221 struct tsocket_address_bsd *lbsda =
1222 talloc_get_type_abort(local->private_data,
1223 struct tsocket_address_bsd);
1224 struct tsocket_address_bsd *rbsda = NULL;
1225 struct tdgram_context *dgram;
1226 struct tdgram_bsd *bsds;
1227 int fd;
1228 int ret;
1229 bool do_bind = false;
1230 bool do_reuseaddr = false;
1231 bool do_ipv6only = false;
1232 bool is_inet = false;
1233 int sa_fam = lbsda->u.sa.sa_family;
1235 if (remote) {
1236 rbsda = talloc_get_type_abort(remote->private_data,
1237 struct tsocket_address_bsd);
1240 switch (lbsda->u.sa.sa_family) {
1241 case AF_UNIX:
1242 if (broadcast) {
1243 errno = EINVAL;
1244 return -1;
1246 if (lbsda->u.un.sun_path[0] != 0) {
1247 do_reuseaddr = true;
1248 do_bind = true;
1250 break;
1251 case AF_INET:
1252 if (lbsda->u.in.sin_port != 0) {
1253 do_reuseaddr = true;
1254 do_bind = true;
1256 if (lbsda->u.in.sin_addr.s_addr != INADDR_ANY) {
1257 do_bind = true;
1259 is_inet = true;
1260 break;
1261 #ifdef HAVE_IPV6
1262 case AF_INET6:
1263 if (lbsda->u.in6.sin6_port != 0) {
1264 do_reuseaddr = true;
1265 do_bind = true;
1267 if (memcmp(&in6addr_any,
1268 &lbsda->u.in6.sin6_addr,
1269 sizeof(in6addr_any)) != 0) {
1270 do_bind = true;
1272 is_inet = true;
1273 do_ipv6only = true;
1274 break;
1275 #endif
1276 default:
1277 errno = EINVAL;
1278 return -1;
1281 if (!do_bind && is_inet && rbsda) {
1282 sa_fam = rbsda->u.sa.sa_family;
1283 switch (sa_fam) {
1284 case AF_INET:
1285 do_ipv6only = false;
1286 break;
1287 #ifdef HAVE_IPV6
1288 case AF_INET6:
1289 do_ipv6only = true;
1290 break;
1291 #endif
1295 fd = socket(sa_fam, SOCK_DGRAM, 0);
1296 if (fd < 0) {
1297 return -1;
1300 fd = tsocket_bsd_common_prepare_fd(fd, true);
1301 if (fd < 0) {
1302 return -1;
1305 dgram = tdgram_context_create(mem_ctx,
1306 &tdgram_bsd_ops,
1307 &bsds,
1308 struct tdgram_bsd,
1309 location);
1310 if (!dgram) {
1311 int saved_errno = errno;
1312 close(fd);
1313 errno = saved_errno;
1314 return -1;
1316 ZERO_STRUCTP(bsds);
1317 bsds->fd = fd;
1318 talloc_set_destructor(bsds, tdgram_bsd_destructor);
1320 #ifdef HAVE_IPV6
1321 if (do_ipv6only) {
1322 int val = 1;
1324 ret = setsockopt(fd, IPPROTO_IPV6, IPV6_V6ONLY,
1325 (const void *)&val, sizeof(val));
1326 if (ret == -1) {
1327 int saved_errno = errno;
1328 talloc_free(dgram);
1329 errno = saved_errno;
1330 return -1;
1333 #endif
1335 if (broadcast) {
1336 int val = 1;
1338 ret = setsockopt(fd, SOL_SOCKET, SO_BROADCAST,
1339 (const void *)&val, sizeof(val));
1340 if (ret == -1) {
1341 int saved_errno = errno;
1342 talloc_free(dgram);
1343 errno = saved_errno;
1344 return -1;
1348 if (do_reuseaddr) {
1349 int val = 1;
1351 ret = setsockopt(fd, SOL_SOCKET, SO_REUSEADDR,
1352 (const void *)&val, sizeof(val));
1353 if (ret == -1) {
1354 int saved_errno = errno;
1355 talloc_free(dgram);
1356 errno = saved_errno;
1357 return -1;
1361 if (do_bind) {
1362 ret = bind(fd, &lbsda->u.sa, lbsda->sa_socklen);
1363 if (ret == -1) {
1364 int saved_errno = errno;
1365 talloc_free(dgram);
1366 errno = saved_errno;
1367 return -1;
1371 if (rbsda) {
1372 if (rbsda->u.sa.sa_family != sa_fam) {
1373 talloc_free(dgram);
1374 errno = EINVAL;
1375 return -1;
1378 ret = connect(fd, &rbsda->u.sa, rbsda->sa_socklen);
1379 if (ret == -1) {
1380 int saved_errno = errno;
1381 talloc_free(dgram);
1382 errno = saved_errno;
1383 return -1;
1387 *_dgram = dgram;
1388 return 0;
1391 int _tdgram_bsd_existing_socket(TALLOC_CTX *mem_ctx,
1392 int fd,
1393 struct tdgram_context **_dgram,
1394 const char *location)
1396 struct tdgram_context *dgram;
1397 struct tdgram_bsd *bsds;
1399 dgram = tdgram_context_create(mem_ctx,
1400 &tdgram_bsd_ops,
1401 &bsds,
1402 struct tdgram_bsd,
1403 location);
1404 if (!dgram) {
1405 return -1;
1407 ZERO_STRUCTP(bsds);
1408 bsds->fd = fd;
1409 talloc_set_destructor(bsds, tdgram_bsd_destructor);
1411 *_dgram = dgram;
1412 return 0;
1415 int _tdgram_inet_udp_socket(const struct tsocket_address *local,
1416 const struct tsocket_address *remote,
1417 TALLOC_CTX *mem_ctx,
1418 struct tdgram_context **dgram,
1419 const char *location)
1421 struct tsocket_address_bsd *lbsda =
1422 talloc_get_type_abort(local->private_data,
1423 struct tsocket_address_bsd);
1424 int ret;
1426 switch (lbsda->u.sa.sa_family) {
1427 case AF_INET:
1428 break;
1429 #ifdef HAVE_IPV6
1430 case AF_INET6:
1431 break;
1432 #endif
1433 default:
1434 errno = EINVAL;
1435 return -1;
1438 ret = tdgram_bsd_dgram_socket(local, remote, false,
1439 mem_ctx, dgram, location);
1441 return ret;
1444 int _tdgram_unix_socket(const struct tsocket_address *local,
1445 const struct tsocket_address *remote,
1446 TALLOC_CTX *mem_ctx,
1447 struct tdgram_context **dgram,
1448 const char *location)
1450 struct tsocket_address_bsd *lbsda =
1451 talloc_get_type_abort(local->private_data,
1452 struct tsocket_address_bsd);
1453 int ret;
1455 switch (lbsda->u.sa.sa_family) {
1456 case AF_UNIX:
1457 break;
1458 default:
1459 errno = EINVAL;
1460 return -1;
1463 ret = tdgram_bsd_dgram_socket(local, remote, false,
1464 mem_ctx, dgram, location);
1466 return ret;
/*
 * Private data of a "bsd" stream context.
 */
struct tstream_bsd {
	/* the socket descriptor */
	int fd;

	/* the tevent context 'fde' was registered on, used for comparison */
	void *event_ptr;
	struct tevent_fd *fde;
	/* flag toggled by tstream_bsd_optimize_readv() */
	bool optimize_readv;

	/* callbacks dispatched by tstream_bsd_fde_handler() */
	void *readable_private;
	void (*readable_handler)(void *private_data);
	void *writeable_private;
	void (*writeable_handler)(void *private_data);
};
1482 bool tstream_bsd_optimize_readv(struct tstream_context *stream,
1483 bool on)
1485 struct tstream_bsd *bsds =
1486 talloc_get_type(_tstream_context_data(stream),
1487 struct tstream_bsd);
1488 bool old;
1490 if (bsds == NULL) {
1491 /* not a bsd socket */
1492 return false;
1495 old = bsds->optimize_readv;
1496 bsds->optimize_readv = on;
1498 return old;
1501 static void tstream_bsd_fde_handler(struct tevent_context *ev,
1502 struct tevent_fd *fde,
1503 uint16_t flags,
1504 void *private_data)
1506 struct tstream_bsd *bsds = talloc_get_type_abort(private_data,
1507 struct tstream_bsd);
1509 if (flags & TEVENT_FD_WRITE) {
1510 bsds->writeable_handler(bsds->writeable_private);
1511 return;
1513 if (flags & TEVENT_FD_READ) {
1514 if (!bsds->readable_handler) {
1515 if (bsds->writeable_handler) {
1516 bsds->writeable_handler(bsds->writeable_private);
1517 return;
1519 TEVENT_FD_NOT_READABLE(bsds->fde);
1520 return;
1522 bsds->readable_handler(bsds->readable_private);
1523 return;
1527 static int tstream_bsd_set_readable_handler(struct tstream_bsd *bsds,
1528 struct tevent_context *ev,
1529 void (*handler)(void *private_data),
1530 void *private_data)
1532 if (ev == NULL) {
1533 if (handler) {
1534 errno = EINVAL;
1535 return -1;
1537 if (!bsds->readable_handler) {
1538 return 0;
1540 bsds->readable_handler = NULL;
1541 bsds->readable_private = NULL;
1543 return 0;
1546 /* read and write must use the same tevent_context */
1547 if (bsds->event_ptr != ev) {
1548 if (bsds->readable_handler || bsds->writeable_handler) {
1549 errno = EINVAL;
1550 return -1;
1552 bsds->event_ptr = NULL;
1553 TALLOC_FREE(bsds->fde);
1556 if (tevent_fd_get_flags(bsds->fde) == 0) {
1557 TALLOC_FREE(bsds->fde);
1559 bsds->fde = tevent_add_fd(ev, bsds,
1560 bsds->fd, TEVENT_FD_READ,
1561 tstream_bsd_fde_handler,
1562 bsds);
1563 if (!bsds->fde) {
1564 errno = ENOMEM;
1565 return -1;
1568 /* cache the event context we're running on */
1569 bsds->event_ptr = ev;
1570 } else if (!bsds->readable_handler) {
1571 TEVENT_FD_READABLE(bsds->fde);
1574 bsds->readable_handler = handler;
1575 bsds->readable_private = private_data;
1577 return 0;
1580 static int tstream_bsd_set_writeable_handler(struct tstream_bsd *bsds,
1581 struct tevent_context *ev,
1582 void (*handler)(void *private_data),
1583 void *private_data)
1585 if (ev == NULL) {
1586 if (handler) {
1587 errno = EINVAL;
1588 return -1;
1590 if (!bsds->writeable_handler) {
1591 return 0;
1593 bsds->writeable_handler = NULL;
1594 bsds->writeable_private = NULL;
1595 TEVENT_FD_NOT_WRITEABLE(bsds->fde);
1597 return 0;
1600 /* read and write must use the same tevent_context */
1601 if (bsds->event_ptr != ev) {
1602 if (bsds->readable_handler || bsds->writeable_handler) {
1603 errno = EINVAL;
1604 return -1;
1606 bsds->event_ptr = NULL;
1607 TALLOC_FREE(bsds->fde);
1610 if (tevent_fd_get_flags(bsds->fde) == 0) {
1611 TALLOC_FREE(bsds->fde);
1613 bsds->fde = tevent_add_fd(ev, bsds,
1614 bsds->fd,
1615 TEVENT_FD_READ | TEVENT_FD_WRITE,
1616 tstream_bsd_fde_handler,
1617 bsds);
1618 if (!bsds->fde) {
1619 errno = ENOMEM;
1620 return -1;
1623 /* cache the event context we're running on */
1624 bsds->event_ptr = ev;
1625 } else if (!bsds->writeable_handler) {
1626 uint16_t flags = tevent_fd_get_flags(bsds->fde);
1627 flags |= TEVENT_FD_READ | TEVENT_FD_WRITE;
1628 tevent_fd_set_flags(bsds->fde, flags);
1631 bsds->writeable_handler = handler;
1632 bsds->writeable_private = private_data;
1634 return 0;
1637 static ssize_t tstream_bsd_pending_bytes(struct tstream_context *stream)
1639 struct tstream_bsd *bsds = tstream_context_data(stream,
1640 struct tstream_bsd);
1641 ssize_t ret;
1643 if (bsds->fd == -1) {
1644 errno = ENOTCONN;
1645 return -1;
1648 ret = tsocket_bsd_pending(bsds->fd);
1650 return ret;
/*
 * Per-request state of tstream_bsd_readv_send/recv.
 */
struct tstream_bsd_readv_state {
	/* the stream the request operates on */
	struct tstream_context *stream;

	/* private copy of the caller's vector; advanced as data arrives */
	struct iovec *vector;
	/* number of entries in vector that are not completely filled yet */
	size_t count;

	/* running total of bytes read so far */
	int ret;
};
1662 static int tstream_bsd_readv_destructor(struct tstream_bsd_readv_state *state)
1664 struct tstream_bsd *bsds = tstream_context_data(state->stream,
1665 struct tstream_bsd);
1667 tstream_bsd_set_readable_handler(bsds, NULL, NULL, NULL);
1669 return 0;
1672 static void tstream_bsd_readv_handler(void *private_data);
1674 static struct tevent_req *tstream_bsd_readv_send(TALLOC_CTX *mem_ctx,
1675 struct tevent_context *ev,
1676 struct tstream_context *stream,
1677 struct iovec *vector,
1678 size_t count)
1680 struct tevent_req *req;
1681 struct tstream_bsd_readv_state *state;
1682 struct tstream_bsd *bsds = tstream_context_data(stream, struct tstream_bsd);
1683 int ret;
1685 req = tevent_req_create(mem_ctx, &state,
1686 struct tstream_bsd_readv_state);
1687 if (!req) {
1688 return NULL;
1691 state->stream = stream;
1692 /* we make a copy of the vector so that we can modify it */
1693 state->vector = talloc_array(state, struct iovec, count);
1694 if (tevent_req_nomem(state->vector, req)) {
1695 goto post;
1697 memcpy(state->vector, vector, sizeof(struct iovec)*count);
1698 state->count = count;
1699 state->ret = 0;
1701 talloc_set_destructor(state, tstream_bsd_readv_destructor);
1703 if (bsds->fd == -1) {
1704 tevent_req_error(req, ENOTCONN);
1705 goto post;
1709 * this is a fast path, not waiting for the
1710 * socket to become explicit readable gains
1711 * about 10%-20% performance in benchmark tests.
1713 if (bsds->optimize_readv) {
1715 * We only do the optimization on
1716 * readv if the caller asked for it.
1718 * This is needed because in most cases
1719 * we preferr to flush send buffers before
1720 * receiving incoming requests.
1722 tstream_bsd_readv_handler(req);
1723 if (!tevent_req_is_in_progress(req)) {
1724 goto post;
1728 ret = tstream_bsd_set_readable_handler(bsds, ev,
1729 tstream_bsd_readv_handler,
1730 req);
1731 if (ret == -1) {
1732 tevent_req_error(req, errno);
1733 goto post;
1736 return req;
1738 post:
1739 tevent_req_post(req, ev);
1740 return req;
1743 static void tstream_bsd_readv_handler(void *private_data)
1745 struct tevent_req *req = talloc_get_type_abort(private_data,
1746 struct tevent_req);
1747 struct tstream_bsd_readv_state *state = tevent_req_data(req,
1748 struct tstream_bsd_readv_state);
1749 struct tstream_context *stream = state->stream;
1750 struct tstream_bsd *bsds = tstream_context_data(stream, struct tstream_bsd);
1751 int ret;
1752 int err;
1753 int _count;
1754 bool ok, retry;
1756 ret = readv(bsds->fd, state->vector, state->count);
1757 if (ret == 0) {
1758 /* propagate end of file */
1759 tevent_req_error(req, EPIPE);
1760 return;
1762 err = tsocket_bsd_error_from_errno(ret, errno, &retry);
1763 if (retry) {
1764 /* retry later */
1765 return;
1767 if (tevent_req_error(req, err)) {
1768 return;
1771 state->ret += ret;
1773 _count = state->count; /* tstream has size_t count, readv has int */
1774 ok = iov_advance(&state->vector, &_count, ret);
1775 state->count = _count;
1777 if (!ok) {
1778 tevent_req_error(req, EINVAL);
1779 return;
1782 if (state->count > 0) {
1783 /* we have more to read */
1784 return;
1787 tevent_req_done(req);
1790 static int tstream_bsd_readv_recv(struct tevent_req *req,
1791 int *perrno)
1793 struct tstream_bsd_readv_state *state = tevent_req_data(req,
1794 struct tstream_bsd_readv_state);
1795 int ret;
1797 ret = tsocket_simple_int_recv(req, perrno);
1798 if (ret == 0) {
1799 ret = state->ret;
1802 tevent_req_received(req);
1803 return ret;
/*
 * Per-request state of tstream_bsd_writev_send/recv.
 */
struct tstream_bsd_writev_state {
	/* the stream the request operates on */
	struct tstream_context *stream;

	/* private copy of the caller's vector; advanced as data is sent */
	struct iovec *vector;
	/* number of entries in vector that are not completely sent yet */
	size_t count;

	/* running total of bytes written so far */
	int ret;
};
1815 static int tstream_bsd_writev_destructor(struct tstream_bsd_writev_state *state)
1817 struct tstream_bsd *bsds = tstream_context_data(state->stream,
1818 struct tstream_bsd);
1820 tstream_bsd_set_writeable_handler(bsds, NULL, NULL, NULL);
1822 return 0;
1825 static void tstream_bsd_writev_handler(void *private_data);
1827 static struct tevent_req *tstream_bsd_writev_send(TALLOC_CTX *mem_ctx,
1828 struct tevent_context *ev,
1829 struct tstream_context *stream,
1830 const struct iovec *vector,
1831 size_t count)
1833 struct tevent_req *req;
1834 struct tstream_bsd_writev_state *state;
1835 struct tstream_bsd *bsds = tstream_context_data(stream, struct tstream_bsd);
1836 int ret;
1838 req = tevent_req_create(mem_ctx, &state,
1839 struct tstream_bsd_writev_state);
1840 if (!req) {
1841 return NULL;
1844 state->stream = stream;
1845 /* we make a copy of the vector so that we can modify it */
1846 state->vector = talloc_array(state, struct iovec, count);
1847 if (tevent_req_nomem(state->vector, req)) {
1848 goto post;
1850 memcpy(state->vector, vector, sizeof(struct iovec)*count);
1851 state->count = count;
1852 state->ret = 0;
1854 talloc_set_destructor(state, tstream_bsd_writev_destructor);
1856 if (bsds->fd == -1) {
1857 tevent_req_error(req, ENOTCONN);
1858 goto post;
1862 * this is a fast path, not waiting for the
1863 * socket to become explicit writeable gains
1864 * about 10%-20% performance in benchmark tests.
1866 tstream_bsd_writev_handler(req);
1867 if (!tevent_req_is_in_progress(req)) {
1868 goto post;
1871 ret = tstream_bsd_set_writeable_handler(bsds, ev,
1872 tstream_bsd_writev_handler,
1873 req);
1874 if (ret == -1) {
1875 tevent_req_error(req, errno);
1876 goto post;
1879 return req;
1881 post:
1882 tevent_req_post(req, ev);
1883 return req;
1886 static void tstream_bsd_writev_handler(void *private_data)
1888 struct tevent_req *req = talloc_get_type_abort(private_data,
1889 struct tevent_req);
1890 struct tstream_bsd_writev_state *state = tevent_req_data(req,
1891 struct tstream_bsd_writev_state);
1892 struct tstream_context *stream = state->stream;
1893 struct tstream_bsd *bsds = tstream_context_data(stream, struct tstream_bsd);
1894 ssize_t ret;
1895 int err;
1896 int _count;
1897 bool ok, retry;
1899 ret = writev(bsds->fd, state->vector, state->count);
1900 if (ret == 0) {
1901 /* propagate end of file */
1902 tevent_req_error(req, EPIPE);
1903 return;
1905 err = tsocket_bsd_error_from_errno(ret, errno, &retry);
1906 if (retry) {
1907 /* retry later */
1908 return;
1910 if (tevent_req_error(req, err)) {
1911 return;
1914 state->ret += ret;
1916 _count = state->count; /* tstream has size_t count, writev has int */
1917 ok = iov_advance(&state->vector, &_count, ret);
1918 state->count = _count;
1920 if (!ok) {
1921 tevent_req_error(req, EINVAL);
1922 return;
1925 if (state->count > 0) {
1926 /* we have more to read */
1927 return;
1930 tevent_req_done(req);
1933 static int tstream_bsd_writev_recv(struct tevent_req *req, int *perrno)
1935 struct tstream_bsd_writev_state *state = tevent_req_data(req,
1936 struct tstream_bsd_writev_state);
1937 int ret;
1939 ret = tsocket_simple_int_recv(req, perrno);
1940 if (ret == 0) {
1941 ret = state->ret;
1944 tevent_req_received(req);
1945 return ret;
/*
 * Request state of tstream_bsd_disconnect_send/recv.  The disconnect
 * completes synchronously, so only a placeholder member is kept.
 */
struct tstream_bsd_disconnect_state {
	void *__dummy;
};
1952 static struct tevent_req *tstream_bsd_disconnect_send(TALLOC_CTX *mem_ctx,
1953 struct tevent_context *ev,
1954 struct tstream_context *stream)
1956 struct tstream_bsd *bsds = tstream_context_data(stream, struct tstream_bsd);
1957 struct tevent_req *req;
1958 struct tstream_bsd_disconnect_state *state;
1959 int ret;
1960 int err;
1961 bool dummy;
1963 req = tevent_req_create(mem_ctx, &state,
1964 struct tstream_bsd_disconnect_state);
1965 if (req == NULL) {
1966 return NULL;
1969 if (bsds->fd == -1) {
1970 tevent_req_error(req, ENOTCONN);
1971 goto post;
1974 TALLOC_FREE(bsds->fde);
1975 ret = close(bsds->fd);
1976 bsds->fd = -1;
1977 err = tsocket_bsd_error_from_errno(ret, errno, &dummy);
1978 if (tevent_req_error(req, err)) {
1979 goto post;
1982 tevent_req_done(req);
1983 post:
1984 tevent_req_post(req, ev);
1985 return req;
/*
 * tstream_context_ops.disconnect_recv implementation: hands back the
 * result of tsocket_simple_int_recv() and marks the request as
 * received.
 */
static int tstream_bsd_disconnect_recv(struct tevent_req *req,
				       int *perrno)
{
	int result = tsocket_simple_int_recv(req, perrno);

	tevent_req_received(req);
	return result;
}
1999 static const struct tstream_context_ops tstream_bsd_ops = {
2000 .name = "bsd",
2002 .pending_bytes = tstream_bsd_pending_bytes,
2004 .readv_send = tstream_bsd_readv_send,
2005 .readv_recv = tstream_bsd_readv_recv,
2007 .writev_send = tstream_bsd_writev_send,
2008 .writev_recv = tstream_bsd_writev_recv,
2010 .disconnect_send = tstream_bsd_disconnect_send,
2011 .disconnect_recv = tstream_bsd_disconnect_recv,
2014 static int tstream_bsd_destructor(struct tstream_bsd *bsds)
2016 TALLOC_FREE(bsds->fde);
2017 if (bsds->fd != -1) {
2018 close(bsds->fd);
2019 bsds->fd = -1;
2021 return 0;
2024 int _tstream_bsd_existing_socket(TALLOC_CTX *mem_ctx,
2025 int fd,
2026 struct tstream_context **_stream,
2027 const char *location)
2029 struct tstream_context *stream;
2030 struct tstream_bsd *bsds;
2032 stream = tstream_context_create(mem_ctx,
2033 &tstream_bsd_ops,
2034 &bsds,
2035 struct tstream_bsd,
2036 location);
2037 if (!stream) {
2038 return -1;
2040 ZERO_STRUCTP(bsds);
2041 bsds->fd = fd;
2042 talloc_set_destructor(bsds, tstream_bsd_destructor);
2044 *_stream = stream;
2045 return 0;
/*
 * Request state of tstream_bsd_connect_send/recv.
 */
struct tstream_bsd_connect_state {
	/* the connecting socket; -1 while none is open or after handover */
	int fd;
	/* fd event waiting for a non-blocking connect() to complete */
	struct tevent_fd *fde;
	/*
	 * Not referenced by the connect code visible in this file section.
	 * The type used to be spelled "struct tstream_conext", which
	 * silently declared a bogus incomplete type.
	 */
	struct tstream_context *stream;
	/* local address of the connection (only set up for inet sockets) */
	struct tsocket_address *local;
};
2055 static int tstream_bsd_connect_destructor(struct tstream_bsd_connect_state *state)
2057 TALLOC_FREE(state->fde);
2058 if (state->fd != -1) {
2059 close(state->fd);
2060 state->fd = -1;
2063 return 0;
2066 static void tstream_bsd_connect_fde_handler(struct tevent_context *ev,
2067 struct tevent_fd *fde,
2068 uint16_t flags,
2069 void *private_data);
2071 static struct tevent_req *tstream_bsd_connect_send(TALLOC_CTX *mem_ctx,
2072 struct tevent_context *ev,
2073 int sys_errno,
2074 const struct tsocket_address *local,
2075 const struct tsocket_address *remote)
2077 struct tevent_req *req;
2078 struct tstream_bsd_connect_state *state;
2079 struct tsocket_address_bsd *lbsda =
2080 talloc_get_type_abort(local->private_data,
2081 struct tsocket_address_bsd);
2082 struct tsocket_address_bsd *lrbsda = NULL;
2083 struct tsocket_address_bsd *rbsda =
2084 talloc_get_type_abort(remote->private_data,
2085 struct tsocket_address_bsd);
2086 int ret;
2087 int err;
2088 bool retry;
2089 bool do_bind = false;
2090 bool do_reuseaddr = false;
2091 bool do_ipv6only = false;
2092 bool is_inet = false;
2093 int sa_fam = lbsda->u.sa.sa_family;
2095 req = tevent_req_create(mem_ctx, &state,
2096 struct tstream_bsd_connect_state);
2097 if (!req) {
2098 return NULL;
2100 state->fd = -1;
2101 state->fde = NULL;
2103 talloc_set_destructor(state, tstream_bsd_connect_destructor);
2105 /* give the wrappers a chance to report an error */
2106 if (sys_errno != 0) {
2107 tevent_req_error(req, sys_errno);
2108 goto post;
2111 switch (lbsda->u.sa.sa_family) {
2112 case AF_UNIX:
2113 if (lbsda->u.un.sun_path[0] != 0) {
2114 do_reuseaddr = true;
2115 do_bind = true;
2117 break;
2118 case AF_INET:
2119 if (lbsda->u.in.sin_port != 0) {
2120 do_reuseaddr = true;
2121 do_bind = true;
2123 if (lbsda->u.in.sin_addr.s_addr != INADDR_ANY) {
2124 do_bind = true;
2126 is_inet = true;
2127 break;
2128 #ifdef HAVE_IPV6
2129 case AF_INET6:
2130 if (lbsda->u.in6.sin6_port != 0) {
2131 do_reuseaddr = true;
2132 do_bind = true;
2134 if (memcmp(&in6addr_any,
2135 &lbsda->u.in6.sin6_addr,
2136 sizeof(in6addr_any)) != 0) {
2137 do_bind = true;
2139 is_inet = true;
2140 do_ipv6only = true;
2141 break;
2142 #endif
2143 default:
2144 tevent_req_error(req, EINVAL);
2145 goto post;
2148 if (!do_bind && is_inet) {
2149 sa_fam = rbsda->u.sa.sa_family;
2150 switch (sa_fam) {
2151 case AF_INET:
2152 do_ipv6only = false;
2153 break;
2154 #ifdef HAVE_IPV6
2155 case AF_INET6:
2156 do_ipv6only = true;
2157 break;
2158 #endif
2162 if (is_inet) {
2163 state->local = tsocket_address_create(state,
2164 &tsocket_address_bsd_ops,
2165 &lrbsda,
2166 struct tsocket_address_bsd,
2167 __location__ "bsd_connect");
2168 if (tevent_req_nomem(state->local, req)) {
2169 goto post;
2172 ZERO_STRUCTP(lrbsda);
2173 lrbsda->sa_socklen = sizeof(lrbsda->u.ss);
2174 #ifdef HAVE_STRUCT_SOCKADDR_SA_LEN
2175 lrbsda->u.sa.sa_len = lrbsda->sa_socklen;
2176 #endif
2179 state->fd = socket(sa_fam, SOCK_STREAM, 0);
2180 if (state->fd == -1) {
2181 tevent_req_error(req, errno);
2182 goto post;
2185 state->fd = tsocket_bsd_common_prepare_fd(state->fd, true);
2186 if (state->fd == -1) {
2187 tevent_req_error(req, errno);
2188 goto post;
2191 #ifdef HAVE_IPV6
2192 if (do_ipv6only) {
2193 int val = 1;
2195 ret = setsockopt(state->fd, IPPROTO_IPV6, IPV6_V6ONLY,
2196 (const void *)&val, sizeof(val));
2197 if (ret == -1) {
2198 tevent_req_error(req, errno);
2199 goto post;
2202 #endif
2204 if (do_reuseaddr) {
2205 int val = 1;
2207 ret = setsockopt(state->fd, SOL_SOCKET, SO_REUSEADDR,
2208 (const void *)&val, sizeof(val));
2209 if (ret == -1) {
2210 tevent_req_error(req, errno);
2211 goto post;
2215 if (do_bind) {
2216 ret = bind(state->fd, &lbsda->u.sa, lbsda->sa_socklen);
2217 if (ret == -1) {
2218 tevent_req_error(req, errno);
2219 goto post;
2223 if (rbsda->u.sa.sa_family != sa_fam) {
2224 tevent_req_error(req, EINVAL);
2225 goto post;
2228 ret = connect(state->fd, &rbsda->u.sa, rbsda->sa_socklen);
2229 err = tsocket_bsd_error_from_errno(ret, errno, &retry);
2230 if (retry) {
2231 /* retry later */
2232 goto async;
2234 if (tevent_req_error(req, err)) {
2235 goto post;
2238 if (!state->local) {
2239 tevent_req_done(req);
2240 goto post;
2243 ret = getsockname(state->fd, &lrbsda->u.sa, &lrbsda->sa_socklen);
2244 if (ret == -1) {
2245 tevent_req_error(req, errno);
2246 goto post;
2249 tevent_req_done(req);
2250 goto post;
2252 async:
2253 state->fde = tevent_add_fd(ev, state,
2254 state->fd,
2255 TEVENT_FD_READ | TEVENT_FD_WRITE,
2256 tstream_bsd_connect_fde_handler,
2257 req);
2258 if (tevent_req_nomem(state->fde, req)) {
2259 goto post;
2262 return req;
2264 post:
2265 tevent_req_post(req, ev);
2266 return req;
2269 static void tstream_bsd_connect_fde_handler(struct tevent_context *ev,
2270 struct tevent_fd *fde,
2271 uint16_t flags,
2272 void *private_data)
2274 struct tevent_req *req = talloc_get_type_abort(private_data,
2275 struct tevent_req);
2276 struct tstream_bsd_connect_state *state = tevent_req_data(req,
2277 struct tstream_bsd_connect_state);
2278 struct tsocket_address_bsd *lrbsda = NULL;
2279 int ret;
2280 int error=0;
2281 socklen_t len = sizeof(error);
2282 int err;
2283 bool retry;
2285 ret = getsockopt(state->fd, SOL_SOCKET, SO_ERROR, &error, &len);
2286 if (ret == 0) {
2287 if (error != 0) {
2288 errno = error;
2289 ret = -1;
2292 err = tsocket_bsd_error_from_errno(ret, errno, &retry);
2293 if (retry) {
2294 /* retry later */
2295 return;
2297 if (tevent_req_error(req, err)) {
2298 return;
2301 if (!state->local) {
2302 tevent_req_done(req);
2303 return;
2306 lrbsda = talloc_get_type_abort(state->local->private_data,
2307 struct tsocket_address_bsd);
2309 ret = getsockname(state->fd, &lrbsda->u.sa, &lrbsda->sa_socklen);
2310 if (ret == -1) {
2311 tevent_req_error(req, errno);
2312 return;
2315 tevent_req_done(req);
2318 static int tstream_bsd_connect_recv(struct tevent_req *req,
2319 int *perrno,
2320 TALLOC_CTX *mem_ctx,
2321 struct tstream_context **stream,
2322 struct tsocket_address **local,
2323 const char *location)
2325 struct tstream_bsd_connect_state *state = tevent_req_data(req,
2326 struct tstream_bsd_connect_state);
2327 int ret;
2329 ret = tsocket_simple_int_recv(req, perrno);
2330 if (ret == 0) {
2331 ret = _tstream_bsd_existing_socket(mem_ctx,
2332 state->fd,
2333 stream,
2334 location);
2335 if (ret == -1) {
2336 *perrno = errno;
2337 goto done;
2339 TALLOC_FREE(state->fde);
2340 state->fd = -1;
2342 if (local) {
2343 *local = talloc_move(mem_ctx, &state->local);
2347 done:
2348 tevent_req_received(req);
2349 return ret;
2352 struct tevent_req * tstream_inet_tcp_connect_send(TALLOC_CTX *mem_ctx,
2353 struct tevent_context *ev,
2354 const struct tsocket_address *local,
2355 const struct tsocket_address *remote)
2357 struct tsocket_address_bsd *lbsda =
2358 talloc_get_type_abort(local->private_data,
2359 struct tsocket_address_bsd);
2360 struct tevent_req *req;
2361 int sys_errno = 0;
2363 switch (lbsda->u.sa.sa_family) {
2364 case AF_INET:
2365 break;
2366 #ifdef HAVE_IPV6
2367 case AF_INET6:
2368 break;
2369 #endif
2370 default:
2371 sys_errno = EINVAL;
2372 break;
2375 req = tstream_bsd_connect_send(mem_ctx, ev, sys_errno, local, remote);
2377 return req;
2380 int _tstream_inet_tcp_connect_recv(struct tevent_req *req,
2381 int *perrno,
2382 TALLOC_CTX *mem_ctx,
2383 struct tstream_context **stream,
2384 struct tsocket_address **local,
2385 const char *location)
2387 return tstream_bsd_connect_recv(req, perrno,
2388 mem_ctx, stream, local,
2389 location);
2392 struct tevent_req * tstream_unix_connect_send(TALLOC_CTX *mem_ctx,
2393 struct tevent_context *ev,
2394 const struct tsocket_address *local,
2395 const struct tsocket_address *remote)
2397 struct tsocket_address_bsd *lbsda =
2398 talloc_get_type_abort(local->private_data,
2399 struct tsocket_address_bsd);
2400 struct tevent_req *req;
2401 int sys_errno = 0;
2403 switch (lbsda->u.sa.sa_family) {
2404 case AF_UNIX:
2405 break;
2406 default:
2407 sys_errno = EINVAL;
2408 break;
2411 req = tstream_bsd_connect_send(mem_ctx, ev, sys_errno, local, remote);
2413 return req;
2416 int _tstream_unix_connect_recv(struct tevent_req *req,
2417 int *perrno,
2418 TALLOC_CTX *mem_ctx,
2419 struct tstream_context **stream,
2420 const char *location)
2422 return tstream_bsd_connect_recv(req, perrno,
2423 mem_ctx, stream, NULL,
2424 location);
2427 int _tstream_unix_socketpair(TALLOC_CTX *mem_ctx1,
2428 struct tstream_context **_stream1,
2429 TALLOC_CTX *mem_ctx2,
2430 struct tstream_context **_stream2,
2431 const char *location)
2433 int ret;
2434 int fds[2];
2435 int fd1;
2436 int fd2;
2437 struct tstream_context *stream1 = NULL;
2438 struct tstream_context *stream2 = NULL;
2440 ret = socketpair(AF_UNIX, SOCK_STREAM, 0, fds);
2441 if (ret == -1) {
2442 return -1;
2444 fd1 = fds[0];
2445 fd2 = fds[1];
2447 fd1 = tsocket_bsd_common_prepare_fd(fd1, true);
2448 if (fd1 == -1) {
2449 int sys_errno = errno;
2450 close(fd2);
2451 errno = sys_errno;
2452 return -1;
2455 fd2 = tsocket_bsd_common_prepare_fd(fd2, true);
2456 if (fd2 == -1) {
2457 int sys_errno = errno;
2458 close(fd1);
2459 errno = sys_errno;
2460 return -1;
2463 ret = _tstream_bsd_existing_socket(mem_ctx1,
2464 fd1,
2465 &stream1,
2466 location);
2467 if (ret == -1) {
2468 int sys_errno = errno;
2469 close(fd1);
2470 close(fd2);
2471 errno = sys_errno;
2472 return -1;
2475 ret = _tstream_bsd_existing_socket(mem_ctx2,
2476 fd2,
2477 &stream2,
2478 location);
2479 if (ret == -1) {
2480 int sys_errno = errno;
2481 talloc_free(stream1);
2482 close(fd2);
2483 errno = sys_errno;
2484 return -1;
2487 *_stream1 = stream1;
2488 *_stream2 = stream2;
2489 return 0;