xref: /freebsd/contrib/unbound/util/netevent.c (revision b7c0c8c18e0f12bc22e251fbcabad719b364a38a)
1b7579f77SDag-Erling Smørgrav /*
2b7579f77SDag-Erling Smørgrav  * util/netevent.c - event notification
3b7579f77SDag-Erling Smørgrav  *
4b7579f77SDag-Erling Smørgrav  * Copyright (c) 2007, NLnet Labs. All rights reserved.
5b7579f77SDag-Erling Smørgrav  *
6b7579f77SDag-Erling Smørgrav  * This software is open source.
7b7579f77SDag-Erling Smørgrav  *
8b7579f77SDag-Erling Smørgrav  * Redistribution and use in source and binary forms, with or without
9b7579f77SDag-Erling Smørgrav  * modification, are permitted provided that the following conditions
10b7579f77SDag-Erling Smørgrav  * are met:
11b7579f77SDag-Erling Smørgrav  *
12b7579f77SDag-Erling Smørgrav  * Redistributions of source code must retain the above copyright notice,
13b7579f77SDag-Erling Smørgrav  * this list of conditions and the following disclaimer.
14b7579f77SDag-Erling Smørgrav  *
15b7579f77SDag-Erling Smørgrav  * Redistributions in binary form must reproduce the above copyright notice,
16b7579f77SDag-Erling Smørgrav  * this list of conditions and the following disclaimer in the documentation
17b7579f77SDag-Erling Smørgrav  * and/or other materials provided with the distribution.
18b7579f77SDag-Erling Smørgrav  *
19b7579f77SDag-Erling Smørgrav  * Neither the name of the NLNET LABS nor the names of its contributors may
20b7579f77SDag-Erling Smørgrav  * be used to endorse or promote products derived from this software without
21b7579f77SDag-Erling Smørgrav  * specific prior written permission.
22b7579f77SDag-Erling Smørgrav  *
23b7579f77SDag-Erling Smørgrav  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
2417d15b25SDag-Erling Smørgrav  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
2517d15b25SDag-Erling Smørgrav  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
2617d15b25SDag-Erling Smørgrav  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
2717d15b25SDag-Erling Smørgrav  * HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
2817d15b25SDag-Erling Smørgrav  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
2917d15b25SDag-Erling Smørgrav  * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
3017d15b25SDag-Erling Smørgrav  * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
3117d15b25SDag-Erling Smørgrav  * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
3217d15b25SDag-Erling Smørgrav  * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
3317d15b25SDag-Erling Smørgrav  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
34b7579f77SDag-Erling Smørgrav  */
35b7579f77SDag-Erling Smørgrav 
36b7579f77SDag-Erling Smørgrav /**
37b7579f77SDag-Erling Smørgrav  * \file
38b7579f77SDag-Erling Smørgrav  *
39b7579f77SDag-Erling Smørgrav  * This file contains event notification functions.
40b7579f77SDag-Erling Smørgrav  */
41b7579f77SDag-Erling Smørgrav #include "config.h"
42b7579f77SDag-Erling Smørgrav #include "util/netevent.h"
43e2d15004SDag-Erling Smørgrav #include "util/ub_event.h"
44b7579f77SDag-Erling Smørgrav #include "util/log.h"
45b7579f77SDag-Erling Smørgrav #include "util/net_help.h"
464c75e3aaSDag-Erling Smørgrav #include "util/tcp_conn_limit.h"
47b7579f77SDag-Erling Smørgrav #include "util/fptr_wlist.h"
48865f46b2SCy Schubert #include "util/proxy_protocol.h"
498f76bb7dSCy Schubert #include "util/timeval_func.h"
5009a3aaf3SDag-Erling Smørgrav #include "sldns/pkthdr.h"
5109a3aaf3SDag-Erling Smørgrav #include "sldns/sbuffer.h"
520fb34990SDag-Erling Smørgrav #include "sldns/str2wire.h"
53ff825849SDag-Erling Smørgrav #include "dnstap/dnstap.h"
5465b390aaSDag-Erling Smørgrav #include "dnscrypt/dnscrypt.h"
55e86b9096SDag-Erling Smørgrav #include "services/listen_dnsport.h"
565469a995SCy Schubert #ifdef HAVE_SYS_TYPES_H
575469a995SCy Schubert #include <sys/types.h>
585469a995SCy Schubert #endif
595469a995SCy Schubert #ifdef HAVE_SYS_SOCKET_H
605469a995SCy Schubert #include <sys/socket.h>
615469a995SCy Schubert #endif
625469a995SCy Schubert #ifdef HAVE_NETDB_H
635469a995SCy Schubert #include <netdb.h>
645469a995SCy Schubert #endif
65865f46b2SCy Schubert #ifdef HAVE_POLL_H
66865f46b2SCy Schubert #include <poll.h>
67865f46b2SCy Schubert #endif
685469a995SCy Schubert 
698ed2b524SDag-Erling Smørgrav #ifdef HAVE_OPENSSL_SSL_H
70b7579f77SDag-Erling Smørgrav #include <openssl/ssl.h>
718ed2b524SDag-Erling Smørgrav #endif
728ed2b524SDag-Erling Smørgrav #ifdef HAVE_OPENSSL_ERR_H
73b7579f77SDag-Erling Smørgrav #include <openssl/err.h>
748ed2b524SDag-Erling Smørgrav #endif
758f76bb7dSCy Schubert #ifdef HAVE_LINUX_NET_TSTAMP_H
768f76bb7dSCy Schubert #include <linux/net_tstamp.h>
778f76bb7dSCy Schubert #endif
78b7579f77SDag-Erling Smørgrav /* -------- Start of local definitions -------- */
/**
 * if CMSG_ALIGN is not defined on this platform, a workaround.
 * Preference order: the platform's __CMSG_ALIGN, then the platform's
 * _CMSG_DATA_ALIGN, then rounding up to a multiple of sizeof(long).
 * The guard tests exactly the macro that the expansion uses, so the
 * branch is only taken when that macro really exists.
 */
#ifndef CMSG_ALIGN
#  ifdef __CMSG_ALIGN
#    define CMSG_ALIGN(n) __CMSG_ALIGN(n)
#  elif defined(_CMSG_DATA_ALIGN)
#    define CMSG_ALIGN(n) _CMSG_DATA_ALIGN(n)
#  else
#    define CMSG_ALIGN(len) (((len)+sizeof(long)-1) & ~(sizeof(long)-1))
#  endif
#endif
89b7579f77SDag-Erling Smørgrav 
/** fallback for CMSG_LEN: the aligned header size plus the payload length */
#ifndef CMSG_LEN
#  define CMSG_LEN(datalen) \
	(CMSG_ALIGN(sizeof(struct cmsghdr)) + (datalen))
#endif

/** fallback for CMSG_SPACE: the aligned payload plus the aligned header,
 * the header is aligned with _CMSG_HDR_ALIGN if the platform has that */
#if !defined(CMSG_SPACE) && defined(_CMSG_HDR_ALIGN)
#  define CMSG_SPACE(datalen) \
	(CMSG_ALIGN(datalen) + _CMSG_HDR_ALIGN(sizeof(struct cmsghdr)))
#elif !defined(CMSG_SPACE)
#  define CMSG_SPACE(datalen) \
	(CMSG_ALIGN(datalen) + CMSG_ALIGN(sizeof(struct cmsghdr)))
#endif
103b7579f77SDag-Erling Smørgrav 
/** The TCP writing query timeout in milliseconds */
#define TCP_QUERY_TIMEOUT 120000
/** The minimum actual TCP timeout to use, in msec, regardless of the
 * value that is advertised */
#define TCP_QUERY_TIMEOUT_MINIMUM 200

/** number of UDP reads to perform per read indication from select,
 * only a single read if nonblocking sockets are broken */
#ifdef NONBLOCKING_IS_BROKEN
#define NUM_UDP_PER_SELECT 1
#else
#define NUM_UDP_PER_SELECT 100
#endif

/** timeout in millisec to wait for write to unblock, packets dropped after.*/
#define SEND_BLOCKED_WAIT_TIMEOUT 200
/** max number of times to wait for write to unblock, packets dropped after.*/
#define SEND_BLOCKED_MAX_RETRY 5

/** Fallback values for the SO_TIMESTAMP* socket options, so that the
 * timestamping code does not need its own ifdefs for them.
 * NOTE(review): the numbers look like the Linux option values - confirm. */
#if !defined(SO_TIMESTAMP)
#define SO_TIMESTAMP 29
#endif
#if !defined(SO_TIMESTAMPNS)
#define SO_TIMESTAMPNS 35
#endif
#if !defined(SO_TIMESTAMPING)
#define SO_TIMESTAMPING 37
#endif
/**
 * Internal event structure: ties a ub_event to the comm base it is
 * registered with. May also be a member of other structures (list, tree).
 */
struct internal_event {
	/** comm base that this event belongs to */
	struct comm_base* base;
	/** the ub_event for this event */
	struct ub_event* ev;
};
142b7579f77SDag-Erling Smørgrav 
/**
 * Internal base structure. There is one per comm base, so that every
 * thread has its own events.
 */
struct internal_base {
	/** the ub_event event_base that drives this comm base */
	struct ub_event_base* base;
	/** current time in seconds, comm_base_timept hands out a pointer
	 * to this field */
	time_t secs;
	/** current time as a timeval, also handed out by comm_base_timept */
	struct timeval now;
	/** event that is used for the slow_accept timeouts */
	struct ub_event* slow_accept;
	/** nonzero if slow_accept is enabled; only then is the slow_accept
	 * event removed and freed when the comm base is deleted */
	int slow_accept_enabled;
	/** last log time for slow logging of file descriptor errors */
	time_t last_slow_log;
	/** last log time for slow logging of write wait failures, limits
	 * how often the blocked udp send message is printed */
	time_t last_writewait_log;
};
162b7579f77SDag-Erling Smørgrav 
163b7579f77SDag-Erling Smørgrav /**
164b7579f77SDag-Erling Smørgrav  * Internal timer structure, to store timer event in.
165b7579f77SDag-Erling Smørgrav  */
166b7579f77SDag-Erling Smørgrav struct internal_timer {
167e2d15004SDag-Erling Smørgrav 	/** the super struct from which derived */
168e2d15004SDag-Erling Smørgrav 	struct comm_timer super;
169b7579f77SDag-Erling Smørgrav 	/** the comm base */
170b7579f77SDag-Erling Smørgrav 	struct comm_base* base;
171e2d15004SDag-Erling Smørgrav 	/** ub_event event type */
172e2d15004SDag-Erling Smørgrav 	struct ub_event* ev;
173b7579f77SDag-Erling Smørgrav 	/** is timer enabled */
174b7579f77SDag-Erling Smørgrav 	uint8_t enabled;
175b7579f77SDag-Erling Smørgrav };
176b7579f77SDag-Erling Smørgrav 
/**
 * Internal signal structure, one element of a singly linked list that
 * stores the signal events.
 */
struct internal_signal {
	/** the ub_event for this signal */
	struct ub_event* ev;
	/** next element in the signal list */
	struct internal_signal* next;
};
186b7579f77SDag-Erling Smørgrav 
187b7579f77SDag-Erling Smørgrav /** create a tcp handler with a parent */
188b7579f77SDag-Erling Smørgrav static struct comm_point* comm_point_create_tcp_handler(
189b7579f77SDag-Erling Smørgrav 	struct comm_base *base, struct comm_point* parent, size_t bufsize,
190e86b9096SDag-Erling Smørgrav 	struct sldns_buffer* spoolbuf, comm_point_callback_type* callback,
1915469a995SCy Schubert 	void* callback_arg, struct unbound_socket* socket);
192b7579f77SDag-Erling Smørgrav 
193b7579f77SDag-Erling Smørgrav /* -------- End of local definitions -------- */
194b7579f77SDag-Erling Smørgrav 
195b7579f77SDag-Erling Smørgrav struct comm_base*
196b7579f77SDag-Erling Smørgrav comm_base_create(int sigs)
197b7579f77SDag-Erling Smørgrav {
198b7579f77SDag-Erling Smørgrav 	struct comm_base* b = (struct comm_base*)calloc(1,
199b7579f77SDag-Erling Smørgrav 		sizeof(struct comm_base));
200e2d15004SDag-Erling Smørgrav 	const char *evnm="event", *evsys="", *evmethod="";
201e2d15004SDag-Erling Smørgrav 
202b7579f77SDag-Erling Smørgrav 	if(!b)
203b7579f77SDag-Erling Smørgrav 		return NULL;
204b7579f77SDag-Erling Smørgrav 	b->eb = (struct internal_base*)calloc(1, sizeof(struct internal_base));
205b7579f77SDag-Erling Smørgrav 	if(!b->eb) {
206b7579f77SDag-Erling Smørgrav 		free(b);
207b7579f77SDag-Erling Smørgrav 		return NULL;
208b7579f77SDag-Erling Smørgrav 	}
209e2d15004SDag-Erling Smørgrav 	b->eb->base = ub_default_event_base(sigs, &b->eb->secs, &b->eb->now);
210b7579f77SDag-Erling Smørgrav 	if(!b->eb->base) {
211b7579f77SDag-Erling Smørgrav 		free(b->eb);
212b7579f77SDag-Erling Smørgrav 		free(b);
213b7579f77SDag-Erling Smørgrav 		return NULL;
214b7579f77SDag-Erling Smørgrav 	}
215e2d15004SDag-Erling Smørgrav 	ub_comm_base_now(b);
216e2d15004SDag-Erling Smørgrav 	ub_get_event_sys(b->eb->base, &evnm, &evsys, &evmethod);
217e86b9096SDag-Erling Smørgrav 	verbose(VERB_ALGO, "%s %s uses %s method.", evnm, evsys, evmethod);
218b7579f77SDag-Erling Smørgrav 	return b;
219b7579f77SDag-Erling Smørgrav }
220b7579f77SDag-Erling Smørgrav 
22117d15b25SDag-Erling Smørgrav struct comm_base*
222e2d15004SDag-Erling Smørgrav comm_base_create_event(struct ub_event_base* base)
22317d15b25SDag-Erling Smørgrav {
22417d15b25SDag-Erling Smørgrav 	struct comm_base* b = (struct comm_base*)calloc(1,
22517d15b25SDag-Erling Smørgrav 		sizeof(struct comm_base));
22617d15b25SDag-Erling Smørgrav 	if(!b)
22717d15b25SDag-Erling Smørgrav 		return NULL;
22817d15b25SDag-Erling Smørgrav 	b->eb = (struct internal_base*)calloc(1, sizeof(struct internal_base));
22917d15b25SDag-Erling Smørgrav 	if(!b->eb) {
23017d15b25SDag-Erling Smørgrav 		free(b);
23117d15b25SDag-Erling Smørgrav 		return NULL;
23217d15b25SDag-Erling Smørgrav 	}
23317d15b25SDag-Erling Smørgrav 	b->eb->base = base;
234e2d15004SDag-Erling Smørgrav 	ub_comm_base_now(b);
23517d15b25SDag-Erling Smørgrav 	return b;
23617d15b25SDag-Erling Smørgrav }
23717d15b25SDag-Erling Smørgrav 
238b7579f77SDag-Erling Smørgrav void
239b7579f77SDag-Erling Smørgrav comm_base_delete(struct comm_base* b)
240b7579f77SDag-Erling Smørgrav {
241b7579f77SDag-Erling Smørgrav 	if(!b)
242b7579f77SDag-Erling Smørgrav 		return;
243b7579f77SDag-Erling Smørgrav 	if(b->eb->slow_accept_enabled) {
244e2d15004SDag-Erling Smørgrav 		if(ub_event_del(b->eb->slow_accept) != 0) {
245b7579f77SDag-Erling Smørgrav 			log_err("could not event_del slow_accept");
246b7579f77SDag-Erling Smørgrav 		}
247e2d15004SDag-Erling Smørgrav 		ub_event_free(b->eb->slow_accept);
248b7579f77SDag-Erling Smørgrav 	}
249e2d15004SDag-Erling Smørgrav 	ub_event_base_free(b->eb->base);
250b7579f77SDag-Erling Smørgrav 	b->eb->base = NULL;
251b7579f77SDag-Erling Smørgrav 	free(b->eb);
252b7579f77SDag-Erling Smørgrav 	free(b);
253b7579f77SDag-Erling Smørgrav }
254b7579f77SDag-Erling Smørgrav 
255b7579f77SDag-Erling Smørgrav void
25617d15b25SDag-Erling Smørgrav comm_base_delete_no_base(struct comm_base* b)
25717d15b25SDag-Erling Smørgrav {
25817d15b25SDag-Erling Smørgrav 	if(!b)
25917d15b25SDag-Erling Smørgrav 		return;
26017d15b25SDag-Erling Smørgrav 	if(b->eb->slow_accept_enabled) {
261e2d15004SDag-Erling Smørgrav 		if(ub_event_del(b->eb->slow_accept) != 0) {
26217d15b25SDag-Erling Smørgrav 			log_err("could not event_del slow_accept");
26317d15b25SDag-Erling Smørgrav 		}
264e2d15004SDag-Erling Smørgrav 		ub_event_free(b->eb->slow_accept);
26517d15b25SDag-Erling Smørgrav 	}
26617d15b25SDag-Erling Smørgrav 	b->eb->base = NULL;
26717d15b25SDag-Erling Smørgrav 	free(b->eb);
26817d15b25SDag-Erling Smørgrav 	free(b);
26917d15b25SDag-Erling Smørgrav }
27017d15b25SDag-Erling Smørgrav 
27117d15b25SDag-Erling Smørgrav void
27217d15b25SDag-Erling Smørgrav comm_base_timept(struct comm_base* b, time_t** tt, struct timeval** tv)
273b7579f77SDag-Erling Smørgrav {
274b7579f77SDag-Erling Smørgrav 	*tt = &b->eb->secs;
275b7579f77SDag-Erling Smørgrav 	*tv = &b->eb->now;
276b7579f77SDag-Erling Smørgrav }
277b7579f77SDag-Erling Smørgrav 
278b7579f77SDag-Erling Smørgrav void
279b7579f77SDag-Erling Smørgrav comm_base_dispatch(struct comm_base* b)
280b7579f77SDag-Erling Smørgrav {
281b7579f77SDag-Erling Smørgrav 	int retval;
282e2d15004SDag-Erling Smørgrav 	retval = ub_event_base_dispatch(b->eb->base);
283e2d15004SDag-Erling Smørgrav 	if(retval < 0) {
284b7579f77SDag-Erling Smørgrav 		fatal_exit("event_dispatch returned error %d, "
285b7579f77SDag-Erling Smørgrav 			"errno is %s", retval, strerror(errno));
286b7579f77SDag-Erling Smørgrav 	}
287b7579f77SDag-Erling Smørgrav }
288b7579f77SDag-Erling Smørgrav 
289b7579f77SDag-Erling Smørgrav void comm_base_exit(struct comm_base* b)
290b7579f77SDag-Erling Smørgrav {
291e2d15004SDag-Erling Smørgrav 	if(ub_event_base_loopexit(b->eb->base) != 0) {
292b7579f77SDag-Erling Smørgrav 		log_err("Could not loopexit");
293b7579f77SDag-Erling Smørgrav 	}
294b7579f77SDag-Erling Smørgrav }
295b7579f77SDag-Erling Smørgrav 
296b7579f77SDag-Erling Smørgrav void comm_base_set_slow_accept_handlers(struct comm_base* b,
297b7579f77SDag-Erling Smørgrav 	void (*stop_acc)(void*), void (*start_acc)(void*), void* arg)
298b7579f77SDag-Erling Smørgrav {
299b7579f77SDag-Erling Smørgrav 	b->stop_accept = stop_acc;
300b7579f77SDag-Erling Smørgrav 	b->start_accept = start_acc;
301b7579f77SDag-Erling Smørgrav 	b->cb_arg = arg;
302b7579f77SDag-Erling Smørgrav }
303b7579f77SDag-Erling Smørgrav 
304e2d15004SDag-Erling Smørgrav struct ub_event_base* comm_base_internal(struct comm_base* b)
305b7579f77SDag-Erling Smørgrav {
306b7579f77SDag-Erling Smørgrav 	return b->eb->base;
307b7579f77SDag-Erling Smørgrav }
308b7579f77SDag-Erling Smørgrav 
309b7579f77SDag-Erling Smørgrav /** see if errno for udp has to be logged or not uses globals */
310b7579f77SDag-Erling Smørgrav static int
311b7579f77SDag-Erling Smørgrav udp_send_errno_needs_log(struct sockaddr* addr, socklen_t addrlen)
312b7579f77SDag-Erling Smørgrav {
313b7579f77SDag-Erling Smørgrav 	/* do not log transient errors (unless high verbosity) */
314b7579f77SDag-Erling Smørgrav #if defined(ENETUNREACH) || defined(EHOSTDOWN) || defined(EHOSTUNREACH) || defined(ENETDOWN)
315b7579f77SDag-Erling Smørgrav 	switch(errno) {
316b7579f77SDag-Erling Smørgrav #  ifdef ENETUNREACH
317b7579f77SDag-Erling Smørgrav 		case ENETUNREACH:
318b7579f77SDag-Erling Smørgrav #  endif
319b7579f77SDag-Erling Smørgrav #  ifdef EHOSTDOWN
320b7579f77SDag-Erling Smørgrav 		case EHOSTDOWN:
321b7579f77SDag-Erling Smørgrav #  endif
322b7579f77SDag-Erling Smørgrav #  ifdef EHOSTUNREACH
323b7579f77SDag-Erling Smørgrav 		case EHOSTUNREACH:
324b7579f77SDag-Erling Smørgrav #  endif
325b7579f77SDag-Erling Smørgrav #  ifdef ENETDOWN
326b7579f77SDag-Erling Smørgrav 		case ENETDOWN:
327b7579f77SDag-Erling Smørgrav #  endif
3285469a995SCy Schubert 		case EPERM:
32924e36522SCy Schubert 		case EACCES:
330b7579f77SDag-Erling Smørgrav 			if(verbosity < VERB_ALGO)
331b7579f77SDag-Erling Smørgrav 				return 0;
332b7579f77SDag-Erling Smørgrav 		default:
333b7579f77SDag-Erling Smørgrav 			break;
334b7579f77SDag-Erling Smørgrav 	}
335b7579f77SDag-Erling Smørgrav #endif
33617d15b25SDag-Erling Smørgrav 	/* permission denied is gotten for every send if the
33717d15b25SDag-Erling Smørgrav 	 * network is disconnected (on some OS), squelch it */
338f61ef7f6SDag-Erling Smørgrav 	if( ((errno == EPERM)
339f61ef7f6SDag-Erling Smørgrav #  ifdef EADDRNOTAVAIL
340f61ef7f6SDag-Erling Smørgrav 		/* 'Cannot assign requested address' also when disconnected */
341f61ef7f6SDag-Erling Smørgrav 		|| (errno == EADDRNOTAVAIL)
342f61ef7f6SDag-Erling Smørgrav #  endif
3435469a995SCy Schubert 		) && verbosity < VERB_ALGO)
34417d15b25SDag-Erling Smørgrav 		return 0;
34557bddd21SDag-Erling Smørgrav #  ifdef EADDRINUSE
34657bddd21SDag-Erling Smørgrav 	/* If SO_REUSEADDR is set, we could try to connect to the same server
34757bddd21SDag-Erling Smørgrav 	 * from the same source port twice. */
34857bddd21SDag-Erling Smørgrav 	if(errno == EADDRINUSE && verbosity < VERB_DETAIL)
34957bddd21SDag-Erling Smørgrav 		return 0;
35057bddd21SDag-Erling Smørgrav #  endif
351b7579f77SDag-Erling Smørgrav 	/* squelch errors where people deploy AAAA ::ffff:bla for
352b7579f77SDag-Erling Smørgrav 	 * authority servers, which we try for intranets. */
353b7579f77SDag-Erling Smørgrav 	if(errno == EINVAL && addr_is_ip4mapped(
354b7579f77SDag-Erling Smørgrav 		(struct sockaddr_storage*)addr, addrlen) &&
355b7579f77SDag-Erling Smørgrav 		verbosity < VERB_DETAIL)
356b7579f77SDag-Erling Smørgrav 		return 0;
357b7579f77SDag-Erling Smørgrav 	/* SO_BROADCAST sockopt can give access to 255.255.255.255,
358b7579f77SDag-Erling Smørgrav 	 * but a dns cache does not need it. */
359b7579f77SDag-Erling Smørgrav 	if(errno == EACCES && addr_is_broadcast(
360b7579f77SDag-Erling Smørgrav 		(struct sockaddr_storage*)addr, addrlen) &&
361b7579f77SDag-Erling Smørgrav 		verbosity < VERB_DETAIL)
362b7579f77SDag-Erling Smørgrav 		return 0;
363b7579f77SDag-Erling Smørgrav 	return 1;
364b7579f77SDag-Erling Smørgrav }
365b7579f77SDag-Erling Smørgrav 
/** see if the errno of a failed tcp connect has to be logged, the
 * decision is the same one as for a failed udp send */
int tcp_connect_errno_needs_log(struct sockaddr* addr, socklen_t addrlen)
{
	int needs_log = udp_send_errno_needs_log(addr, addrlen);

	return needs_log;
}
370b7579f77SDag-Erling Smørgrav 
371b7579f77SDag-Erling Smørgrav /* send a UDP reply */
372b7579f77SDag-Erling Smørgrav int
37317d15b25SDag-Erling Smørgrav comm_point_send_udp_msg(struct comm_point *c, sldns_buffer* packet,
3747341cb0cSXin LI 	struct sockaddr* addr, socklen_t addrlen, int is_connected)
375b7579f77SDag-Erling Smørgrav {
376b7579f77SDag-Erling Smørgrav 	ssize_t sent;
377b7579f77SDag-Erling Smørgrav 	log_assert(c->fd != -1);
378b7579f77SDag-Erling Smørgrav #ifdef UNBOUND_DEBUG
37917d15b25SDag-Erling Smørgrav 	if(sldns_buffer_remaining(packet) == 0)
380b7579f77SDag-Erling Smørgrav 		log_err("error: send empty UDP packet");
381b7579f77SDag-Erling Smørgrav #endif
382b7579f77SDag-Erling Smørgrav 	log_assert(addr && addrlen > 0);
3837341cb0cSXin LI 	if(!is_connected) {
38417d15b25SDag-Erling Smørgrav 		sent = sendto(c->fd, (void*)sldns_buffer_begin(packet),
38517d15b25SDag-Erling Smørgrav 			sldns_buffer_remaining(packet), 0,
386b7579f77SDag-Erling Smørgrav 			addr, addrlen);
387369c6923SCy Schubert 	} else {
388369c6923SCy Schubert 		sent = send(c->fd, (void*)sldns_buffer_begin(packet),
389369c6923SCy Schubert 			sldns_buffer_remaining(packet), 0);
390369c6923SCy Schubert 	}
391b7579f77SDag-Erling Smørgrav 	if(sent == -1) {
392f61ef7f6SDag-Erling Smørgrav 		/* try again and block, waiting for IO to complete,
393f61ef7f6SDag-Erling Smørgrav 		 * we want to send the answer, and we will wait for
394f61ef7f6SDag-Erling Smørgrav 		 * the ethernet interface buffer to have space. */
395f61ef7f6SDag-Erling Smørgrav #ifndef USE_WINSOCK
396865f46b2SCy Schubert 		if(errno == EAGAIN || errno == EINTR ||
397f61ef7f6SDag-Erling Smørgrav #  ifdef EWOULDBLOCK
398f61ef7f6SDag-Erling Smørgrav 			errno == EWOULDBLOCK ||
399f61ef7f6SDag-Erling Smørgrav #  endif
400f61ef7f6SDag-Erling Smørgrav 			errno == ENOBUFS) {
401f61ef7f6SDag-Erling Smørgrav #else
402f61ef7f6SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAEINPROGRESS ||
403865f46b2SCy Schubert 			WSAGetLastError() == WSAEINTR ||
404f61ef7f6SDag-Erling Smørgrav 			WSAGetLastError() == WSAENOBUFS ||
405f61ef7f6SDag-Erling Smørgrav 			WSAGetLastError() == WSAEWOULDBLOCK) {
406f61ef7f6SDag-Erling Smørgrav #endif
4076e71235eSCy Schubert 			int retries = 0;
408865f46b2SCy Schubert 			/* if we set the fd blocking, other threads suddenly
409865f46b2SCy Schubert 			 * have a blocking fd that they operate on */
4106e71235eSCy Schubert 			while(sent == -1 && retries < SEND_BLOCKED_MAX_RETRY && (
411865f46b2SCy Schubert #ifndef USE_WINSOCK
412865f46b2SCy Schubert 				errno == EAGAIN || errno == EINTR ||
413865f46b2SCy Schubert #  ifdef EWOULDBLOCK
414865f46b2SCy Schubert 				errno == EWOULDBLOCK ||
415865f46b2SCy Schubert #  endif
416865f46b2SCy Schubert 				errno == ENOBUFS
417865f46b2SCy Schubert #else
418865f46b2SCy Schubert 				WSAGetLastError() == WSAEINPROGRESS ||
419865f46b2SCy Schubert 				WSAGetLastError() == WSAEINTR ||
420865f46b2SCy Schubert 				WSAGetLastError() == WSAENOBUFS ||
421865f46b2SCy Schubert 				WSAGetLastError() == WSAEWOULDBLOCK
422865f46b2SCy Schubert #endif
423865f46b2SCy Schubert 			)) {
424865f46b2SCy Schubert #if defined(HAVE_POLL) || defined(USE_WINSOCK)
4256e71235eSCy Schubert 				int send_nobufs = (
4266e71235eSCy Schubert #ifndef USE_WINSOCK
4276e71235eSCy Schubert 					errno == ENOBUFS
4286e71235eSCy Schubert #else
4296e71235eSCy Schubert 					WSAGetLastError() == WSAENOBUFS
4306e71235eSCy Schubert #endif
4316e71235eSCy Schubert 				);
432865f46b2SCy Schubert 				struct pollfd p;
433865f46b2SCy Schubert 				int pret;
434865f46b2SCy Schubert 				memset(&p, 0, sizeof(p));
435865f46b2SCy Schubert 				p.fd = c->fd;
436865f46b2SCy Schubert 				p.events = POLLOUT | POLLERR | POLLHUP;
437865f46b2SCy Schubert #  ifndef USE_WINSOCK
438865f46b2SCy Schubert 				pret = poll(&p, 1, SEND_BLOCKED_WAIT_TIMEOUT);
439865f46b2SCy Schubert #  else
440865f46b2SCy Schubert 				pret = WSAPoll(&p, 1,
441865f46b2SCy Schubert 					SEND_BLOCKED_WAIT_TIMEOUT);
442865f46b2SCy Schubert #  endif
443865f46b2SCy Schubert 				if(pret == 0) {
444865f46b2SCy Schubert 					/* timer expired */
445865f46b2SCy Schubert 					struct comm_base* b = c->ev->base;
446865f46b2SCy Schubert 					if(b->eb->last_writewait_log+SLOW_LOG_TIME <=
447865f46b2SCy Schubert 						b->eb->secs) {
448865f46b2SCy Schubert 						b->eb->last_writewait_log = b->eb->secs;
449865f46b2SCy Schubert 						verbose(VERB_OPS, "send udp blocked "
450865f46b2SCy Schubert 							"for long, dropping packet.");
451865f46b2SCy Schubert 					}
452865f46b2SCy Schubert 					return 0;
453865f46b2SCy Schubert 				} else if(pret < 0 &&
454865f46b2SCy Schubert #ifndef USE_WINSOCK
455865f46b2SCy Schubert 					errno != EAGAIN && errno != EINTR &&
456865f46b2SCy Schubert #  ifdef EWOULDBLOCK
457865f46b2SCy Schubert 					errno != EWOULDBLOCK &&
458865f46b2SCy Schubert #  endif
459865f46b2SCy Schubert 					errno != ENOBUFS
460865f46b2SCy Schubert #else
461865f46b2SCy Schubert 					WSAGetLastError() != WSAEINPROGRESS &&
462865f46b2SCy Schubert 					WSAGetLastError() != WSAEINTR &&
463865f46b2SCy Schubert 					WSAGetLastError() != WSAENOBUFS &&
464865f46b2SCy Schubert 					WSAGetLastError() != WSAEWOULDBLOCK
465865f46b2SCy Schubert #endif
466865f46b2SCy Schubert 					) {
467865f46b2SCy Schubert 					log_err("poll udp out failed: %s",
468865f46b2SCy Schubert 						sock_strerror(errno));
469865f46b2SCy Schubert 					return 0;
4706e71235eSCy Schubert 				} else if((pret < 0 &&
4716e71235eSCy Schubert #ifndef USE_WINSOCK
4726e71235eSCy Schubert 					errno == ENOBUFS
4736e71235eSCy Schubert #else
4746e71235eSCy Schubert 					WSAGetLastError() == WSAENOBUFS
4756e71235eSCy Schubert #endif
4766e71235eSCy Schubert 					) || (send_nobufs && retries > 0)) {
4776e71235eSCy Schubert 					/* ENOBUFS, and poll returned without
4786e71235eSCy Schubert 					 * a timeout. Or the retried send call
4796e71235eSCy Schubert 					 * returned ENOBUFS. It is good to
4806e71235eSCy Schubert 					 * wait a bit for the error to clear. */
4816e71235eSCy Schubert 					/* The timeout is 20*(2^(retries+1)),
4826e71235eSCy Schubert 					 * it increases exponentially, starting
4836e71235eSCy Schubert 					 * at 40 msec. After 5 tries, 1240 msec
4846e71235eSCy Schubert 					 * have passed in total, when poll
4856e71235eSCy Schubert 					 * returned the error, and 1200 msec
4866e71235eSCy Schubert 					 * when send returned the errors. */
4876e71235eSCy Schubert #ifndef USE_WINSOCK
4886e71235eSCy Schubert 					pret = poll(NULL, 0, (SEND_BLOCKED_WAIT_TIMEOUT/10)<<(retries+1));
4896e71235eSCy Schubert #else
4906e71235eSCy Schubert 					pret = WSAPoll(NULL, 0, (SEND_BLOCKED_WAIT_TIMEOUT/10)<<(retries+1));
4916e71235eSCy Schubert #endif
4926e71235eSCy Schubert 					if(pret < 0 &&
4936e71235eSCy Schubert #ifndef USE_WINSOCK
4946e71235eSCy Schubert 						errno != EAGAIN && errno != EINTR &&
4956e71235eSCy Schubert #  ifdef EWOULDBLOCK
4966e71235eSCy Schubert 						errno != EWOULDBLOCK &&
4976e71235eSCy Schubert #  endif
4986e71235eSCy Schubert 						errno != ENOBUFS
4996e71235eSCy Schubert #else
5006e71235eSCy Schubert 						WSAGetLastError() != WSAEINPROGRESS &&
5016e71235eSCy Schubert 						WSAGetLastError() != WSAEINTR &&
5026e71235eSCy Schubert 						WSAGetLastError() != WSAENOBUFS &&
5036e71235eSCy Schubert 						WSAGetLastError() != WSAEWOULDBLOCK
5046e71235eSCy Schubert #endif
5056e71235eSCy Schubert 					) {
5066e71235eSCy Schubert 						log_err("poll udp out timer failed: %s",
5076e71235eSCy Schubert 							sock_strerror(errno));
5086e71235eSCy Schubert 					}
509865f46b2SCy Schubert 				}
510865f46b2SCy Schubert #endif /* defined(HAVE_POLL) || defined(USE_WINSOCK) */
5116e71235eSCy Schubert 				retries++;
5127341cb0cSXin LI 				if (!is_connected) {
513f61ef7f6SDag-Erling Smørgrav 					sent = sendto(c->fd, (void*)sldns_buffer_begin(packet),
514f61ef7f6SDag-Erling Smørgrav 						sldns_buffer_remaining(packet), 0,
515f61ef7f6SDag-Erling Smørgrav 						addr, addrlen);
5167341cb0cSXin LI 				} else {
5177341cb0cSXin LI 					sent = send(c->fd, (void*)sldns_buffer_begin(packet),
5187341cb0cSXin LI 						sldns_buffer_remaining(packet), 0);
5197341cb0cSXin LI 				}
520865f46b2SCy Schubert 			}
521f61ef7f6SDag-Erling Smørgrav 		}
522f61ef7f6SDag-Erling Smørgrav 	}
523f61ef7f6SDag-Erling Smørgrav 	if(sent == -1) {
524b7579f77SDag-Erling Smørgrav 		if(!udp_send_errno_needs_log(addr, addrlen))
525b7579f77SDag-Erling Smørgrav 			return 0;
5267341cb0cSXin LI 		if (!is_connected) {
527c0caa2e2SCy Schubert 			verbose(VERB_OPS, "sendto failed: %s", sock_strerror(errno));
5287341cb0cSXin LI 		} else {
5297341cb0cSXin LI 			verbose(VERB_OPS, "send failed: %s", sock_strerror(errno));
5307341cb0cSXin LI 		}
531f44e67d1SCy Schubert 		if(addr)
532b7579f77SDag-Erling Smørgrav 			log_addr(VERB_OPS, "remote address is",
533b7579f77SDag-Erling Smørgrav 				(struct sockaddr_storage*)addr, addrlen);
534b7579f77SDag-Erling Smørgrav 		return 0;
53517d15b25SDag-Erling Smørgrav 	} else if((size_t)sent != sldns_buffer_remaining(packet)) {
536b7579f77SDag-Erling Smørgrav 		log_err("sent %d in place of %d bytes",
53717d15b25SDag-Erling Smørgrav 			(int)sent, (int)sldns_buffer_remaining(packet));
538b7579f77SDag-Erling Smørgrav 		return 0;
539b7579f77SDag-Erling Smørgrav 	}
540b7579f77SDag-Erling Smørgrav 	return 1;
541b7579f77SDag-Erling Smørgrav }
542b7579f77SDag-Erling Smørgrav 
#if defined(AF_INET6) && defined(IPV6_PKTINFO) && (defined(HAVE_RECVMSG) || defined(HAVE_SENDMSG))
/**
 * Print debug ancillary info with log_info.
 * @param str: prefix for the log line.
 * @param r: the reply; srctype 6 selects the IPv6 packet info and
 *	srctype 4 the IPv4 info, another value is logged as unknown.
 */
static void p_ancil(const char* str, struct comm_reply* r)
{
	switch(r->srctype) {
	case 6: {
#ifdef IPV6_PKTINFO
		char addrstr[1024];
		if(!inet_ntop(AF_INET6, &r->pktinfo.v6info.ipi6_addr,
			addrstr, (socklen_t)sizeof(addrstr))) {
			(void)strlcpy(addrstr, "(inet_ntop error)",
				sizeof(addrstr));
		}
		addrstr[sizeof(addrstr)-1]=0;
		log_info("%s: %s %d", str, addrstr,
			r->pktinfo.v6info.ipi6_ifindex);
#endif
		break;
	}
	case 4: {
#ifdef IP_PKTINFO
		char addrstr[1024], specstr[1024];
		if(!inet_ntop(AF_INET, &r->pktinfo.v4info.ipi_addr,
			addrstr, (socklen_t)sizeof(addrstr))) {
			(void)strlcpy(addrstr, "(inet_ntop error)",
				sizeof(addrstr));
		}
		addrstr[sizeof(addrstr)-1]=0;
#  ifdef HAVE_STRUCT_IN_PKTINFO_IPI_SPEC_DST
		if(!inet_ntop(AF_INET, &r->pktinfo.v4info.ipi_spec_dst,
			specstr, (socklen_t)sizeof(specstr))) {
			(void)strlcpy(specstr, "(inet_ntop error)",
				sizeof(specstr));
		}
		specstr[sizeof(specstr)-1]=0;
#  else
		/* no ipi_spec_dst member, print an empty string for it */
		specstr[0]=0;
#  endif
		log_info("%s: %d %s %s", str, r->pktinfo.v4info.ipi_ifindex,
			addrstr, specstr);
#elif defined(IP_RECVDSTADDR)
		char addrstr[1024];
		if(!inet_ntop(AF_INET, &r->pktinfo.v4addr,
			addrstr, (socklen_t)sizeof(addrstr))) {
			(void)strlcpy(addrstr, "(inet_ntop error)",
				sizeof(addrstr));
		}
		addrstr[sizeof(addrstr)-1]=0;
		log_info("%s: %s", str, addrstr);
#endif /* IP_PKTINFO or IP_RECVDSTADDR */
		break;
	}
	default:
		log_info("%s: unknown srctype %d", str, r->srctype);
		break;
	}
}
#endif /* AF_INET6 && IPV6_PKTINFO && HAVE_RECVMSG||HAVE_SENDMSG */
593b7579f77SDag-Erling Smørgrav 
594b7579f77SDag-Erling Smørgrav /** send a UDP reply over specified interface*/
595b7579f77SDag-Erling Smørgrav static int
59617d15b25SDag-Erling Smørgrav comm_point_send_udp_msg_if(struct comm_point *c, sldns_buffer* packet,
597b7579f77SDag-Erling Smørgrav 	struct sockaddr* addr, socklen_t addrlen, struct comm_reply* r)
598b7579f77SDag-Erling Smørgrav {
599b7579f77SDag-Erling Smørgrav #if defined(AF_INET6) && defined(IPV6_PKTINFO) && defined(HAVE_SENDMSG)
600b7579f77SDag-Erling Smørgrav 	ssize_t sent;
601b7579f77SDag-Erling Smørgrav 	struct msghdr msg;
602b7579f77SDag-Erling Smørgrav 	struct iovec iov[1];
60325039b37SCy Schubert 	union {
60425039b37SCy Schubert 		struct cmsghdr hdr;
60525039b37SCy Schubert 		char buf[256];
60625039b37SCy Schubert 	} control;
607b7579f77SDag-Erling Smørgrav #ifndef S_SPLINT_S
608b7579f77SDag-Erling Smørgrav 	struct cmsghdr *cmsg;
609b7579f77SDag-Erling Smørgrav #endif /* S_SPLINT_S */
610b7579f77SDag-Erling Smørgrav 
611b7579f77SDag-Erling Smørgrav 	log_assert(c->fd != -1);
612b7579f77SDag-Erling Smørgrav #ifdef UNBOUND_DEBUG
61317d15b25SDag-Erling Smørgrav 	if(sldns_buffer_remaining(packet) == 0)
614b7579f77SDag-Erling Smørgrav 		log_err("error: send empty UDP packet");
615b7579f77SDag-Erling Smørgrav #endif
616b7579f77SDag-Erling Smørgrav 	log_assert(addr && addrlen > 0);
617b7579f77SDag-Erling Smørgrav 
618b7579f77SDag-Erling Smørgrav 	msg.msg_name = addr;
619b7579f77SDag-Erling Smørgrav 	msg.msg_namelen = addrlen;
62017d15b25SDag-Erling Smørgrav 	iov[0].iov_base = sldns_buffer_begin(packet);
62117d15b25SDag-Erling Smørgrav 	iov[0].iov_len = sldns_buffer_remaining(packet);
622b7579f77SDag-Erling Smørgrav 	msg.msg_iov = iov;
623b7579f77SDag-Erling Smørgrav 	msg.msg_iovlen = 1;
62425039b37SCy Schubert 	msg.msg_control = control.buf;
625b7579f77SDag-Erling Smørgrav #ifndef S_SPLINT_S
62625039b37SCy Schubert 	msg.msg_controllen = sizeof(control.buf);
627b7579f77SDag-Erling Smørgrav #endif /* S_SPLINT_S */
628b7579f77SDag-Erling Smørgrav 	msg.msg_flags = 0;
629b7579f77SDag-Erling Smørgrav 
630b7579f77SDag-Erling Smørgrav #ifndef S_SPLINT_S
631b7579f77SDag-Erling Smørgrav 	cmsg = CMSG_FIRSTHDR(&msg);
632b7579f77SDag-Erling Smørgrav 	if(r->srctype == 4) {
633b7579f77SDag-Erling Smørgrav #ifdef IP_PKTINFO
63409a3aaf3SDag-Erling Smørgrav 		void* cmsg_data;
635b7579f77SDag-Erling Smørgrav 		msg.msg_controllen = CMSG_SPACE(sizeof(struct in_pktinfo));
63625039b37SCy Schubert 		log_assert(msg.msg_controllen <= sizeof(control.buf));
637b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_level = IPPROTO_IP;
638b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_type = IP_PKTINFO;
639b7579f77SDag-Erling Smørgrav 		memmove(CMSG_DATA(cmsg), &r->pktinfo.v4info,
640b7579f77SDag-Erling Smørgrav 			sizeof(struct in_pktinfo));
64109a3aaf3SDag-Erling Smørgrav 		/* unset the ifindex to not bypass the routing tables */
64209a3aaf3SDag-Erling Smørgrav 		cmsg_data = CMSG_DATA(cmsg);
64309a3aaf3SDag-Erling Smørgrav 		((struct in_pktinfo *) cmsg_data)->ipi_ifindex = 0;
644b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_len = CMSG_LEN(sizeof(struct in_pktinfo));
6458f76bb7dSCy Schubert 		/* zero the padding bytes inserted by the CMSG_LEN */
6468f76bb7dSCy Schubert 		if(sizeof(struct in_pktinfo) < cmsg->cmsg_len)
6478f76bb7dSCy Schubert 			memset(((uint8_t*)(CMSG_DATA(cmsg))) +
6488f76bb7dSCy Schubert 				sizeof(struct in_pktinfo), 0, cmsg->cmsg_len
6498f76bb7dSCy Schubert 				- sizeof(struct in_pktinfo));
650b7579f77SDag-Erling Smørgrav #elif defined(IP_SENDSRCADDR)
651b7579f77SDag-Erling Smørgrav 		msg.msg_controllen = CMSG_SPACE(sizeof(struct in_addr));
65225039b37SCy Schubert 		log_assert(msg.msg_controllen <= sizeof(control.buf));
653b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_level = IPPROTO_IP;
654b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_type = IP_SENDSRCADDR;
655b7579f77SDag-Erling Smørgrav 		memmove(CMSG_DATA(cmsg), &r->pktinfo.v4addr,
656b7579f77SDag-Erling Smørgrav 			sizeof(struct in_addr));
657b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_len = CMSG_LEN(sizeof(struct in_addr));
6588f76bb7dSCy Schubert 		/* zero the padding bytes inserted by the CMSG_LEN */
6598f76bb7dSCy Schubert 		if(sizeof(struct in_addr) < cmsg->cmsg_len)
6608f76bb7dSCy Schubert 			memset(((uint8_t*)(CMSG_DATA(cmsg))) +
6618f76bb7dSCy Schubert 				sizeof(struct in_addr), 0, cmsg->cmsg_len
6628f76bb7dSCy Schubert 				- sizeof(struct in_addr));
663b7579f77SDag-Erling Smørgrav #else
664b7579f77SDag-Erling Smørgrav 		verbose(VERB_ALGO, "no IP_PKTINFO or IP_SENDSRCADDR");
665b7579f77SDag-Erling Smørgrav 		msg.msg_control = NULL;
666b7579f77SDag-Erling Smørgrav #endif /* IP_PKTINFO or IP_SENDSRCADDR */
667b7579f77SDag-Erling Smørgrav 	} else if(r->srctype == 6) {
66809a3aaf3SDag-Erling Smørgrav 		void* cmsg_data;
669b7579f77SDag-Erling Smørgrav 		msg.msg_controllen = CMSG_SPACE(sizeof(struct in6_pktinfo));
67025039b37SCy Schubert 		log_assert(msg.msg_controllen <= sizeof(control.buf));
671b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_level = IPPROTO_IPV6;
672b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_type = IPV6_PKTINFO;
673b7579f77SDag-Erling Smørgrav 		memmove(CMSG_DATA(cmsg), &r->pktinfo.v6info,
674b7579f77SDag-Erling Smørgrav 			sizeof(struct in6_pktinfo));
67509a3aaf3SDag-Erling Smørgrav 		/* unset the ifindex to not bypass the routing tables */
67609a3aaf3SDag-Erling Smørgrav 		cmsg_data = CMSG_DATA(cmsg);
67709a3aaf3SDag-Erling Smørgrav 		((struct in6_pktinfo *) cmsg_data)->ipi6_ifindex = 0;
678b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_len = CMSG_LEN(sizeof(struct in6_pktinfo));
6798f76bb7dSCy Schubert 		/* zero the padding bytes inserted by the CMSG_LEN */
6808f76bb7dSCy Schubert 		if(sizeof(struct in6_pktinfo) < cmsg->cmsg_len)
6818f76bb7dSCy Schubert 			memset(((uint8_t*)(CMSG_DATA(cmsg))) +
6828f76bb7dSCy Schubert 				sizeof(struct in6_pktinfo), 0, cmsg->cmsg_len
6838f76bb7dSCy Schubert 				- sizeof(struct in6_pktinfo));
684b7579f77SDag-Erling Smørgrav 	} else {
685b7579f77SDag-Erling Smørgrav 		/* try to pass all 0 to use default route */
686b7579f77SDag-Erling Smørgrav 		msg.msg_controllen = CMSG_SPACE(sizeof(struct in6_pktinfo));
68725039b37SCy Schubert 		log_assert(msg.msg_controllen <= sizeof(control.buf));
688b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_level = IPPROTO_IPV6;
689b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_type = IPV6_PKTINFO;
690b7579f77SDag-Erling Smørgrav 		memset(CMSG_DATA(cmsg), 0, sizeof(struct in6_pktinfo));
691b7579f77SDag-Erling Smørgrav 		cmsg->cmsg_len = CMSG_LEN(sizeof(struct in6_pktinfo));
6928f76bb7dSCy Schubert 		/* zero the padding bytes inserted by the CMSG_LEN */
6938f76bb7dSCy Schubert 		if(sizeof(struct in6_pktinfo) < cmsg->cmsg_len)
6948f76bb7dSCy Schubert 			memset(((uint8_t*)(CMSG_DATA(cmsg))) +
6958f76bb7dSCy Schubert 				sizeof(struct in6_pktinfo), 0, cmsg->cmsg_len
6968f76bb7dSCy Schubert 				- sizeof(struct in6_pktinfo));
697b7579f77SDag-Erling Smørgrav 	}
698b7579f77SDag-Erling Smørgrav #endif /* S_SPLINT_S */
6998f76bb7dSCy Schubert 	if(verbosity >= VERB_ALGO && r->srctype != 0)
700b7579f77SDag-Erling Smørgrav 		p_ancil("send_udp over interface", r);
701b7579f77SDag-Erling Smørgrav 	sent = sendmsg(c->fd, &msg, 0);
702b7579f77SDag-Erling Smørgrav 	if(sent == -1) {
703f61ef7f6SDag-Erling Smørgrav 		/* try again and block, waiting for IO to complete,
704f61ef7f6SDag-Erling Smørgrav 		 * we want to send the answer, and we will wait for
705f61ef7f6SDag-Erling Smørgrav 		 * the ethernet interface buffer to have space. */
706f61ef7f6SDag-Erling Smørgrav #ifndef USE_WINSOCK
707865f46b2SCy Schubert 		if(errno == EAGAIN || errno == EINTR ||
708f61ef7f6SDag-Erling Smørgrav #  ifdef EWOULDBLOCK
709f61ef7f6SDag-Erling Smørgrav 			errno == EWOULDBLOCK ||
710f61ef7f6SDag-Erling Smørgrav #  endif
711f61ef7f6SDag-Erling Smørgrav 			errno == ENOBUFS) {
712f61ef7f6SDag-Erling Smørgrav #else
713f61ef7f6SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAEINPROGRESS ||
714865f46b2SCy Schubert 			WSAGetLastError() == WSAEINTR ||
715f61ef7f6SDag-Erling Smørgrav 			WSAGetLastError() == WSAENOBUFS ||
716f61ef7f6SDag-Erling Smørgrav 			WSAGetLastError() == WSAEWOULDBLOCK) {
717f61ef7f6SDag-Erling Smørgrav #endif
7186e71235eSCy Schubert 			int retries = 0;
7196e71235eSCy Schubert 			while(sent == -1 && retries < SEND_BLOCKED_MAX_RETRY && (
720865f46b2SCy Schubert #ifndef USE_WINSOCK
721865f46b2SCy Schubert 				errno == EAGAIN || errno == EINTR ||
722865f46b2SCy Schubert #  ifdef EWOULDBLOCK
723865f46b2SCy Schubert 				errno == EWOULDBLOCK ||
724865f46b2SCy Schubert #  endif
725865f46b2SCy Schubert 				errno == ENOBUFS
726865f46b2SCy Schubert #else
727865f46b2SCy Schubert 				WSAGetLastError() == WSAEINPROGRESS ||
728865f46b2SCy Schubert 				WSAGetLastError() == WSAEINTR ||
729865f46b2SCy Schubert 				WSAGetLastError() == WSAENOBUFS ||
730865f46b2SCy Schubert 				WSAGetLastError() == WSAEWOULDBLOCK
731865f46b2SCy Schubert #endif
732865f46b2SCy Schubert 			)) {
733865f46b2SCy Schubert #if defined(HAVE_POLL) || defined(USE_WINSOCK)
7346e71235eSCy Schubert 				int send_nobufs = (
7356e71235eSCy Schubert #ifndef USE_WINSOCK
7366e71235eSCy Schubert 					errno == ENOBUFS
7376e71235eSCy Schubert #else
7386e71235eSCy Schubert 					WSAGetLastError() == WSAENOBUFS
7396e71235eSCy Schubert #endif
7406e71235eSCy Schubert 				);
741865f46b2SCy Schubert 				struct pollfd p;
742865f46b2SCy Schubert 				int pret;
743865f46b2SCy Schubert 				memset(&p, 0, sizeof(p));
744865f46b2SCy Schubert 				p.fd = c->fd;
745865f46b2SCy Schubert 				p.events = POLLOUT | POLLERR | POLLHUP;
746865f46b2SCy Schubert #  ifndef USE_WINSOCK
747865f46b2SCy Schubert 				pret = poll(&p, 1, SEND_BLOCKED_WAIT_TIMEOUT);
748865f46b2SCy Schubert #  else
749865f46b2SCy Schubert 				pret = WSAPoll(&p, 1,
750865f46b2SCy Schubert 					SEND_BLOCKED_WAIT_TIMEOUT);
751865f46b2SCy Schubert #  endif
752865f46b2SCy Schubert 				if(pret == 0) {
753865f46b2SCy Schubert 					/* timer expired */
754865f46b2SCy Schubert 					struct comm_base* b = c->ev->base;
755865f46b2SCy Schubert 					if(b->eb->last_writewait_log+SLOW_LOG_TIME <=
756865f46b2SCy Schubert 						b->eb->secs) {
757865f46b2SCy Schubert 						b->eb->last_writewait_log = b->eb->secs;
758865f46b2SCy Schubert 						verbose(VERB_OPS, "send udp blocked "
759865f46b2SCy Schubert 							"for long, dropping packet.");
760865f46b2SCy Schubert 					}
761865f46b2SCy Schubert 					return 0;
762865f46b2SCy Schubert 				} else if(pret < 0 &&
763865f46b2SCy Schubert #ifndef USE_WINSOCK
764865f46b2SCy Schubert 					errno != EAGAIN && errno != EINTR &&
765865f46b2SCy Schubert #  ifdef EWOULDBLOCK
766865f46b2SCy Schubert 					errno != EWOULDBLOCK &&
767865f46b2SCy Schubert #  endif
768865f46b2SCy Schubert 					errno != ENOBUFS
769865f46b2SCy Schubert #else
770865f46b2SCy Schubert 					WSAGetLastError() != WSAEINPROGRESS &&
771865f46b2SCy Schubert 					WSAGetLastError() != WSAEINTR &&
772865f46b2SCy Schubert 					WSAGetLastError() != WSAENOBUFS &&
773865f46b2SCy Schubert 					WSAGetLastError() != WSAEWOULDBLOCK
774865f46b2SCy Schubert #endif
775865f46b2SCy Schubert 					) {
776865f46b2SCy Schubert 					log_err("poll udp out failed: %s",
777865f46b2SCy Schubert 						sock_strerror(errno));
778865f46b2SCy Schubert 					return 0;
7796e71235eSCy Schubert 				} else if((pret < 0 &&
7806e71235eSCy Schubert #ifndef USE_WINSOCK
7816e71235eSCy Schubert 					errno == ENOBUFS
7826e71235eSCy Schubert #else
7836e71235eSCy Schubert 					WSAGetLastError() == WSAENOBUFS
7846e71235eSCy Schubert #endif
7856e71235eSCy Schubert 					) || (send_nobufs && retries > 0)) {
7866e71235eSCy Schubert 					/* ENOBUFS, and poll returned without
7876e71235eSCy Schubert 					 * a timeout. Or the retried send call
7886e71235eSCy Schubert 					 * returned ENOBUFS. It is good to
7896e71235eSCy Schubert 					 * wait a bit for the error to clear. */
7906e71235eSCy Schubert 					/* The timeout is 20*(2^(retries+1)),
7916e71235eSCy Schubert 					 * it increases exponentially, starting
7926e71235eSCy Schubert 					 * at 40 msec. After 5 tries, 1240 msec
7936e71235eSCy Schubert 					 * have passed in total, when poll
7946e71235eSCy Schubert 					 * returned the error, and 1200 msec
7956e71235eSCy Schubert 					 * when send returned the errors. */
7966e71235eSCy Schubert #ifndef USE_WINSOCK
7976e71235eSCy Schubert 					pret = poll(NULL, 0, (SEND_BLOCKED_WAIT_TIMEOUT/10)<<(retries+1));
7986e71235eSCy Schubert #else
7996e71235eSCy Schubert 					pret = WSAPoll(NULL, 0, (SEND_BLOCKED_WAIT_TIMEOUT/10)<<(retries+1));
8006e71235eSCy Schubert #endif
8016e71235eSCy Schubert 					if(pret < 0 &&
8026e71235eSCy Schubert #ifndef USE_WINSOCK
8036e71235eSCy Schubert 						errno != EAGAIN && errno != EINTR &&
8046e71235eSCy Schubert #  ifdef EWOULDBLOCK
8056e71235eSCy Schubert 						errno != EWOULDBLOCK &&
8066e71235eSCy Schubert #  endif
8076e71235eSCy Schubert 						errno != ENOBUFS
8086e71235eSCy Schubert #else
8096e71235eSCy Schubert 						WSAGetLastError() != WSAEINPROGRESS &&
8106e71235eSCy Schubert 						WSAGetLastError() != WSAEINTR &&
8116e71235eSCy Schubert 						WSAGetLastError() != WSAENOBUFS &&
8126e71235eSCy Schubert 						WSAGetLastError() != WSAEWOULDBLOCK
8136e71235eSCy Schubert #endif
8146e71235eSCy Schubert 					) {
8156e71235eSCy Schubert 						log_err("poll udp out timer failed: %s",
8166e71235eSCy Schubert 							sock_strerror(errno));
8176e71235eSCy Schubert 					}
818865f46b2SCy Schubert 				}
819865f46b2SCy Schubert #endif /* defined(HAVE_POLL) || defined(USE_WINSOCK) */
8206e71235eSCy Schubert 				retries++;
821f61ef7f6SDag-Erling Smørgrav 				sent = sendmsg(c->fd, &msg, 0);
822865f46b2SCy Schubert 			}
823f61ef7f6SDag-Erling Smørgrav 		}
824f61ef7f6SDag-Erling Smørgrav 	}
825f61ef7f6SDag-Erling Smørgrav 	if(sent == -1) {
826b7579f77SDag-Erling Smørgrav 		if(!udp_send_errno_needs_log(addr, addrlen))
827b7579f77SDag-Erling Smørgrav 			return 0;
828b7579f77SDag-Erling Smørgrav 		verbose(VERB_OPS, "sendmsg failed: %s", strerror(errno));
829b7579f77SDag-Erling Smørgrav 		log_addr(VERB_OPS, "remote address is",
830b7579f77SDag-Erling Smørgrav 			(struct sockaddr_storage*)addr, addrlen);
831f61ef7f6SDag-Erling Smørgrav #ifdef __NetBSD__
832f61ef7f6SDag-Erling Smørgrav 		/* netbsd 7 has IP_PKTINFO for recv but not send */
833f61ef7f6SDag-Erling Smørgrav 		if(errno == EINVAL && r->srctype == 4)
834f61ef7f6SDag-Erling Smørgrav 			log_err("sendmsg: No support for sendmsg(IP_PKTINFO). "
835f61ef7f6SDag-Erling Smørgrav 				"Please disable interface-automatic");
836f61ef7f6SDag-Erling Smørgrav #endif
837b7579f77SDag-Erling Smørgrav 		return 0;
83817d15b25SDag-Erling Smørgrav 	} else if((size_t)sent != sldns_buffer_remaining(packet)) {
839b7579f77SDag-Erling Smørgrav 		log_err("sent %d in place of %d bytes",
84017d15b25SDag-Erling Smørgrav 			(int)sent, (int)sldns_buffer_remaining(packet));
841b7579f77SDag-Erling Smørgrav 		return 0;
842b7579f77SDag-Erling Smørgrav 	}
843b7579f77SDag-Erling Smørgrav 	return 1;
844b7579f77SDag-Erling Smørgrav #else
845b7579f77SDag-Erling Smørgrav 	(void)c;
846b7579f77SDag-Erling Smørgrav 	(void)packet;
847b7579f77SDag-Erling Smørgrav 	(void)addr;
848b7579f77SDag-Erling Smørgrav 	(void)addrlen;
849b7579f77SDag-Erling Smørgrav 	(void)r;
850b7579f77SDag-Erling Smørgrav 	log_err("sendmsg: IPV6_PKTINFO not supported");
851b7579f77SDag-Erling Smørgrav 	return 0;
852b7579f77SDag-Erling Smørgrav #endif /* AF_INET6 && IPV6_PKTINFO && HAVE_SENDMSG */
853b7579f77SDag-Erling Smørgrav }
854b7579f77SDag-Erling Smørgrav 
855369c6923SCy Schubert /** return true is UDP receive error needs to be logged */
856369c6923SCy Schubert static int udp_recv_needs_log(int err)
857369c6923SCy Schubert {
858369c6923SCy Schubert 	switch(err) {
859f44e67d1SCy Schubert 	case EACCES: /* some hosts send ICMP 'Permission Denied' */
860f44e67d1SCy Schubert #ifndef USE_WINSOCK
861369c6923SCy Schubert 	case ECONNREFUSED:
862369c6923SCy Schubert #  ifdef ENETUNREACH
863369c6923SCy Schubert 	case ENETUNREACH:
864369c6923SCy Schubert #  endif
865369c6923SCy Schubert #  ifdef EHOSTDOWN
866369c6923SCy Schubert 	case EHOSTDOWN:
867369c6923SCy Schubert #  endif
868369c6923SCy Schubert #  ifdef EHOSTUNREACH
869369c6923SCy Schubert 	case EHOSTUNREACH:
870369c6923SCy Schubert #  endif
871369c6923SCy Schubert #  ifdef ENETDOWN
872369c6923SCy Schubert 	case ENETDOWN:
873369c6923SCy Schubert #  endif
874f44e67d1SCy Schubert #else /* USE_WINSOCK */
875f44e67d1SCy Schubert 	case WSAECONNREFUSED:
876f44e67d1SCy Schubert 	case WSAENETUNREACH:
877f44e67d1SCy Schubert 	case WSAEHOSTDOWN:
878f44e67d1SCy Schubert 	case WSAEHOSTUNREACH:
879f44e67d1SCy Schubert 	case WSAENETDOWN:
880f44e67d1SCy Schubert #endif
881369c6923SCy Schubert 		if(verbosity >= VERB_ALGO)
882369c6923SCy Schubert 			return 1;
883369c6923SCy Schubert 		return 0;
884369c6923SCy Schubert 	default:
885369c6923SCy Schubert 		break;
886369c6923SCy Schubert 	}
887369c6923SCy Schubert 	return 1;
888369c6923SCy Schubert }
889369c6923SCy Schubert 
890865f46b2SCy Schubert /** Parses the PROXYv2 header from buf and updates the comm_reply struct.
891865f46b2SCy Schubert  *  Returns 1 on success, 0 on failure. */
892865f46b2SCy Schubert static int consume_pp2_header(struct sldns_buffer* buf, struct comm_reply* rep,
893865f46b2SCy Schubert 	int stream) {
894865f46b2SCy Schubert 	size_t size;
895103ba509SCy Schubert 	struct pp2_header *header;
896103ba509SCy Schubert 	int err = pp2_read_header(sldns_buffer_begin(buf),
897103ba509SCy Schubert 		sldns_buffer_remaining(buf));
898103ba509SCy Schubert 	if(err) return 0;
899103ba509SCy Schubert 	header = (struct pp2_header*)sldns_buffer_begin(buf);
900865f46b2SCy Schubert 	size = PP2_HEADER_SIZE + ntohs(header->len);
901865f46b2SCy Schubert 	if((header->ver_cmd & 0xF) == PP2_CMD_LOCAL) {
902865f46b2SCy Schubert 		/* A connection from the proxy itself.
903865f46b2SCy Schubert 		 * No need to do anything with addresses. */
904865f46b2SCy Schubert 		goto done;
905865f46b2SCy Schubert 	}
906103ba509SCy Schubert 	if(header->fam_prot == PP2_UNSPEC_UNSPEC) {
907865f46b2SCy Schubert 		/* Unspecified family and protocol. This could be used for
908865f46b2SCy Schubert 		 * health checks by proxies.
909865f46b2SCy Schubert 		 * No need to do anything with addresses. */
910865f46b2SCy Schubert 		goto done;
911865f46b2SCy Schubert 	}
912865f46b2SCy Schubert 	/* Read the proxied address */
913865f46b2SCy Schubert 	switch(header->fam_prot) {
914103ba509SCy Schubert 		case PP2_INET_STREAM:
915103ba509SCy Schubert 		case PP2_INET_DGRAM:
916865f46b2SCy Schubert 			{
917865f46b2SCy Schubert 			struct sockaddr_in* addr =
918865f46b2SCy Schubert 				(struct sockaddr_in*)&rep->client_addr;
919865f46b2SCy Schubert 			addr->sin_family = AF_INET;
920865f46b2SCy Schubert 			addr->sin_addr.s_addr = header->addr.addr4.src_addr;
921865f46b2SCy Schubert 			addr->sin_port = header->addr.addr4.src_port;
922865f46b2SCy Schubert 			rep->client_addrlen = (socklen_t)sizeof(struct sockaddr_in);
923865f46b2SCy Schubert 			}
924865f46b2SCy Schubert 			/* Ignore the destination address; it should be us. */
925865f46b2SCy Schubert 			break;
926103ba509SCy Schubert 		case PP2_INET6_STREAM:
927103ba509SCy Schubert 		case PP2_INET6_DGRAM:
928865f46b2SCy Schubert 			{
929865f46b2SCy Schubert 			struct sockaddr_in6* addr =
930865f46b2SCy Schubert 				(struct sockaddr_in6*)&rep->client_addr;
931865f46b2SCy Schubert 			memset(addr, 0, sizeof(*addr));
932865f46b2SCy Schubert 			addr->sin6_family = AF_INET6;
933865f46b2SCy Schubert 			memcpy(&addr->sin6_addr,
934865f46b2SCy Schubert 				header->addr.addr6.src_addr, 16);
935865f46b2SCy Schubert 			addr->sin6_port = header->addr.addr6.src_port;
936865f46b2SCy Schubert 			rep->client_addrlen = (socklen_t)sizeof(struct sockaddr_in6);
937865f46b2SCy Schubert 			}
938865f46b2SCy Schubert 			/* Ignore the destination address; it should be us. */
939865f46b2SCy Schubert 			break;
940103ba509SCy Schubert 		default:
941103ba509SCy Schubert 			log_err("proxy_protocol: unsupported family and "
942103ba509SCy Schubert 				"protocol 0x%x", (int)header->fam_prot);
943103ba509SCy Schubert 			return 0;
944865f46b2SCy Schubert 	}
945865f46b2SCy Schubert 	rep->is_proxied = 1;
946865f46b2SCy Schubert done:
947865f46b2SCy Schubert 	if(!stream) {
948865f46b2SCy Schubert 		/* We are reading a whole packet;
949865f46b2SCy Schubert 		 * Move the rest of the data to overwrite the PROXYv2 header */
950865f46b2SCy Schubert 		/* XXX can we do better to avoid memmove? */
9511838dec3SCy Schubert 		memmove(header, ((char*)header)+size,
952865f46b2SCy Schubert 			sldns_buffer_limit(buf)-size);
953865f46b2SCy Schubert 		sldns_buffer_set_limit(buf, sldns_buffer_limit(buf)-size);
954865f46b2SCy Schubert 	}
955865f46b2SCy Schubert 	return 1;
956865f46b2SCy Schubert }
957865f46b2SCy Schubert 
#if defined(AF_INET6) && defined(IPV6_PKTINFO) && defined(HAVE_RECVMSG)
/**
 * Event callback for a UDP comm point that is read with recvmsg(), so
 * that the ancillary data (packet info, receive timestamp) is available.
 *
 * Up to NUM_UDP_PER_SELECT packets are read per call. For every packet
 * the comm point callback is invoked, and if that returns nonzero a reply
 * is sent back right away with comm_point_send_udp_msg_if().
 *
 * @param fd: the socket that has an event, equal to the comm point fd.
 * @param event: event flags, only UB_EV_READ is handled.
 * @param arg: the struct comm_point, of type comm_udp.
 */
void
comm_point_udp_ancil_callback(int fd, short event, void* arg)
{
	struct comm_reply rep;
	struct msghdr msg;
	struct iovec iov[1];
	ssize_t nread;
	/* the union aligns the control buffer for a struct cmsghdr */
	union {
		struct cmsghdr hdr;
		char buf[256];
	} ancil;
	int count;
#ifndef S_SPLINT_S
	struct cmsghdr* cmsg;
#endif /* S_SPLINT_S */
#ifdef HAVE_LINUX_NET_TSTAMP_H
	struct timespec *ts;
#endif /* HAVE_LINUX_NET_TSTAMP_H */

	rep.c = (struct comm_point*)arg;
	log_assert(rep.c->type == comm_udp);

	if(!(event&UB_EV_READ))
		return;
	log_assert(rep.c && rep.c->buffer && rep.c->fd == fd);
	ub_comm_base_now(rep.c->ev->base);
	for(count=0; count<NUM_UDP_PER_SELECT; count++) {
		/* start every packet with an empty buffer and timestamp */
		sldns_buffer_clear(rep.c->buffer);
		timeval_clear(&rep.c->recv_tv);
		rep.remote_addrlen = (socklen_t)sizeof(rep.remote_addr);
		log_assert(fd != -1);
		log_assert(sldns_buffer_remaining(rep.c->buffer) > 0);

		/* set up the message header for the receive */
		iov[0].iov_base = sldns_buffer_begin(rep.c->buffer);
		iov[0].iov_len = sldns_buffer_remaining(rep.c->buffer);
		msg.msg_name = &rep.remote_addr;
		msg.msg_namelen = (socklen_t)sizeof(rep.remote_addr);
		msg.msg_iov = iov;
		msg.msg_iovlen = 1;
		msg.msg_control = ancil.buf;
#ifndef S_SPLINT_S
		msg.msg_controllen = sizeof(ancil.buf);
#endif /* S_SPLINT_S */
		msg.msg_flags = 0;

		nread = recvmsg(fd, &msg, MSG_DONTWAIT);
		if(nread == -1) {
			/* EAGAIN and EINTR are never logged */
			if(errno != EAGAIN && errno != EINTR
				&& udp_recv_needs_log(errno)) {
				log_err("recvmsg failed: %s", strerror(errno));
			}
			return;
		}
		rep.remote_addrlen = msg.msg_namelen;
		sldns_buffer_skip(rep.c->buffer, nread);
		sldns_buffer_flip(rep.c->buffer);
		rep.srctype = 0;
		rep.is_proxied = 0;
#ifndef S_SPLINT_S
		/* walk the ancillary data; the scan stops at the first
		 * packet info item, timestamps do not stop the scan */
		for(cmsg = CMSG_FIRSTHDR(&msg); cmsg != NULL;
			cmsg = CMSG_NXTHDR(&msg, cmsg)) {
			if(cmsg->cmsg_level == IPPROTO_IPV6 &&
				cmsg->cmsg_type == IPV6_PKTINFO) {
				rep.srctype = 6;
				memmove(&rep.pktinfo.v6info, CMSG_DATA(cmsg),
					sizeof(struct in6_pktinfo));
				break;
			}
#ifdef IP_PKTINFO
			if(cmsg->cmsg_level == IPPROTO_IP &&
				cmsg->cmsg_type == IP_PKTINFO) {
				rep.srctype = 4;
				memmove(&rep.pktinfo.v4info, CMSG_DATA(cmsg),
					sizeof(struct in_pktinfo));
				break;
			}
#elif defined(IP_RECVDSTADDR)
			if(cmsg->cmsg_level == IPPROTO_IP &&
				cmsg->cmsg_type == IP_RECVDSTADDR) {
				rep.srctype = 4;
				memmove(&rep.pktinfo.v4addr, CMSG_DATA(cmsg),
					sizeof(struct in_addr));
				break;
			}
#endif /* IP_PKTINFO or IP_RECVDSTADDR */
#ifdef HAVE_LINUX_NET_TSTAMP_H
			if(cmsg->cmsg_level == SOL_SOCKET &&
				cmsg->cmsg_type == SO_TIMESTAMPNS) {
				ts = (struct timespec *)CMSG_DATA(cmsg);
				TIMESPEC_TO_TIMEVAL(&rep.c->recv_tv, ts);
			} else if(cmsg->cmsg_level == SOL_SOCKET &&
				cmsg->cmsg_type == SO_TIMESTAMPING) {
				ts = (struct timespec *)CMSG_DATA(cmsg);
				TIMESPEC_TO_TIMEVAL(&rep.c->recv_tv, ts);
			} else if(cmsg->cmsg_level == SOL_SOCKET &&
				cmsg->cmsg_type == SO_TIMESTAMP) {
				memmove(&rep.c->recv_tv, CMSG_DATA(cmsg), sizeof(struct timeval));
			}
#endif /* HAVE_LINUX_NET_TSTAMP_H */
		}

		if(verbosity >= VERB_ALGO && rep.srctype != 0)
			p_ancil("receive_udp on interface", &rep);
#endif /* S_SPLINT_S */

		if(rep.c->pp2_enabled && !consume_pp2_header(rep.c->buffer,
			&rep, 0)) {
			log_err("proxy_protocol: could not consume PROXYv2 header");
			return;
		}
		if(!rep.is_proxied) {
			/* no proxied address, the client is the sender */
			rep.client_addrlen = rep.remote_addrlen;
			memmove(&rep.client_addr, &rep.remote_addr,
				rep.remote_addrlen);
		}

		fptr_ok(fptr_whitelist_comm_point(rep.c->callback));
		if((*rep.c->callback)(rep.c, rep.c->cb_arg, NETEVENT_NOERROR, &rep)) {
			/* send back immediate reply */
			struct sldns_buffer *answer;
#ifdef USE_DNSCRYPT
			answer = rep.c->dnscrypt_buffer;
#else
			answer = rep.c->buffer;
#endif
			/* the reply goes to the address the packet came
			 * from, not to the proxied client address */
			(void)comm_point_send_udp_msg_if(rep.c, answer,
				(struct sockaddr*)&rep.remote_addr,
				rep.remote_addrlen, &rep);
		}
		if(!rep.c || rep.c->fd == -1) /* commpoint closed */
			break;
	}
}
#endif /* AF_INET6 && IPV6_PKTINFO && HAVE_RECVMSG */
1088b7579f77SDag-Erling Smørgrav 
1089b7579f77SDag-Erling Smørgrav void
1090b7579f77SDag-Erling Smørgrav comm_point_udp_callback(int fd, short event, void* arg)
1091b7579f77SDag-Erling Smørgrav {
1092b7579f77SDag-Erling Smørgrav 	struct comm_reply rep;
1093b7579f77SDag-Erling Smørgrav 	ssize_t rcv;
1094b7579f77SDag-Erling Smørgrav 	int i;
109565b390aaSDag-Erling Smørgrav 	struct sldns_buffer *buffer;
1096b7579f77SDag-Erling Smørgrav 
1097b7579f77SDag-Erling Smørgrav 	rep.c = (struct comm_point*)arg;
1098b7579f77SDag-Erling Smørgrav 	log_assert(rep.c->type == comm_udp);
1099b7579f77SDag-Erling Smørgrav 
1100e2d15004SDag-Erling Smørgrav 	if(!(event&UB_EV_READ))
1101b7579f77SDag-Erling Smørgrav 		return;
1102b7579f77SDag-Erling Smørgrav 	log_assert(rep.c && rep.c->buffer && rep.c->fd == fd);
1103e2d15004SDag-Erling Smørgrav 	ub_comm_base_now(rep.c->ev->base);
1104b7579f77SDag-Erling Smørgrav 	for(i=0; i<NUM_UDP_PER_SELECT; i++) {
110517d15b25SDag-Erling Smørgrav 		sldns_buffer_clear(rep.c->buffer);
1106865f46b2SCy Schubert 		rep.remote_addrlen = (socklen_t)sizeof(rep.remote_addr);
1107b7579f77SDag-Erling Smørgrav 		log_assert(fd != -1);
110817d15b25SDag-Erling Smørgrav 		log_assert(sldns_buffer_remaining(rep.c->buffer) > 0);
110917d15b25SDag-Erling Smørgrav 		rcv = recvfrom(fd, (void*)sldns_buffer_begin(rep.c->buffer),
1110865f46b2SCy Schubert 			sldns_buffer_remaining(rep.c->buffer), MSG_DONTWAIT,
1111865f46b2SCy Schubert 			(struct sockaddr*)&rep.remote_addr, &rep.remote_addrlen);
1112b7579f77SDag-Erling Smørgrav 		if(rcv == -1) {
1113b7579f77SDag-Erling Smørgrav #ifndef USE_WINSOCK
1114369c6923SCy Schubert 			if(errno != EAGAIN && errno != EINTR
1115369c6923SCy Schubert 				&& udp_recv_needs_log(errno))
1116b7579f77SDag-Erling Smørgrav 				log_err("recvfrom %d failed: %s",
1117b7579f77SDag-Erling Smørgrav 					fd, strerror(errno));
1118b7579f77SDag-Erling Smørgrav #else
1119b7579f77SDag-Erling Smørgrav 			if(WSAGetLastError() != WSAEINPROGRESS &&
1120b7579f77SDag-Erling Smørgrav 				WSAGetLastError() != WSAECONNRESET &&
1121f44e67d1SCy Schubert 				WSAGetLastError()!= WSAEWOULDBLOCK &&
1122f44e67d1SCy Schubert 				udp_recv_needs_log(WSAGetLastError()))
1123b7579f77SDag-Erling Smørgrav 				log_err("recvfrom failed: %s",
1124b7579f77SDag-Erling Smørgrav 					wsa_strerror(WSAGetLastError()));
1125b7579f77SDag-Erling Smørgrav #endif
1126b7579f77SDag-Erling Smørgrav 			return;
1127b7579f77SDag-Erling Smørgrav 		}
112817d15b25SDag-Erling Smørgrav 		sldns_buffer_skip(rep.c->buffer, rcv);
112917d15b25SDag-Erling Smørgrav 		sldns_buffer_flip(rep.c->buffer);
1130b7579f77SDag-Erling Smørgrav 		rep.srctype = 0;
1131865f46b2SCy Schubert 		rep.is_proxied = 0;
1132865f46b2SCy Schubert 
1133865f46b2SCy Schubert 		if(rep.c->pp2_enabled && !consume_pp2_header(rep.c->buffer,
1134865f46b2SCy Schubert 			&rep, 0)) {
1135865f46b2SCy Schubert 			log_err("proxy_protocol: could not consume PROXYv2 header");
1136865f46b2SCy Schubert 			return;
1137865f46b2SCy Schubert 		}
1138865f46b2SCy Schubert 		if(!rep.is_proxied) {
1139865f46b2SCy Schubert 			rep.client_addrlen = rep.remote_addrlen;
1140865f46b2SCy Schubert 			memmove(&rep.client_addr, &rep.remote_addr,
1141865f46b2SCy Schubert 				rep.remote_addrlen);
1142865f46b2SCy Schubert 		}
1143865f46b2SCy Schubert 
1144b7579f77SDag-Erling Smørgrav 		fptr_ok(fptr_whitelist_comm_point(rep.c->callback));
1145b7579f77SDag-Erling Smørgrav 		if((*rep.c->callback)(rep.c, rep.c->cb_arg, NETEVENT_NOERROR, &rep)) {
1146b7579f77SDag-Erling Smørgrav 			/* send back immediate reply */
114765b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
114865b390aaSDag-Erling Smørgrav 			buffer = rep.c->dnscrypt_buffer;
114965b390aaSDag-Erling Smørgrav #else
115065b390aaSDag-Erling Smørgrav 			buffer = rep.c->buffer;
115165b390aaSDag-Erling Smørgrav #endif
115265b390aaSDag-Erling Smørgrav 			(void)comm_point_send_udp_msg(rep.c, buffer,
1153865f46b2SCy Schubert 				(struct sockaddr*)&rep.remote_addr,
1154865f46b2SCy Schubert 				rep.remote_addrlen, 0);
1155b7579f77SDag-Erling Smørgrav 		}
115657bddd21SDag-Erling Smørgrav 		if(!rep.c || rep.c->fd != fd) /* commpoint closed to -1 or reused for
1157b7579f77SDag-Erling Smørgrav 		another UDP port. Note rep.c cannot be reused with TCP fd. */
1158b7579f77SDag-Erling Smørgrav 			break;
1159b7579f77SDag-Erling Smørgrav 	}
1160b7579f77SDag-Erling Smørgrav }
1161b7579f77SDag-Erling Smørgrav 
1162f44e67d1SCy Schubert int adjusted_tcp_timeout(struct comm_point* c)
1163f44e67d1SCy Schubert {
1164f44e67d1SCy Schubert 	if(c->tcp_timeout_msec < TCP_QUERY_TIMEOUT_MINIMUM)
1165f44e67d1SCy Schubert 		return TCP_QUERY_TIMEOUT_MINIMUM;
1166f44e67d1SCy Schubert 	return c->tcp_timeout_msec;
1167f44e67d1SCy Schubert }
1168f44e67d1SCy Schubert 
1169b7579f77SDag-Erling Smørgrav /** Use a new tcp handler for new query fd, set to read query */
1170b7579f77SDag-Erling Smørgrav static void
1171b5663de9SDag-Erling Smørgrav setup_tcp_handler(struct comm_point* c, int fd, int cur, int max)
1172b7579f77SDag-Erling Smørgrav {
11734c75e3aaSDag-Erling Smørgrav 	int handler_usage;
1174c0caa2e2SCy Schubert 	log_assert(c->type == comm_tcp || c->type == comm_http);
1175b7579f77SDag-Erling Smørgrav 	log_assert(c->fd == -1);
117617d15b25SDag-Erling Smørgrav 	sldns_buffer_clear(c->buffer);
117765b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
117865b390aaSDag-Erling Smørgrav 	if (c->dnscrypt)
117965b390aaSDag-Erling Smørgrav 		sldns_buffer_clear(c->dnscrypt_buffer);
118065b390aaSDag-Erling Smørgrav #endif
1181b7579f77SDag-Erling Smørgrav 	c->tcp_is_reading = 1;
1182b7579f77SDag-Erling Smørgrav 	c->tcp_byte_count = 0;
118324e36522SCy Schubert 	c->tcp_keepalive = 0;
1184b5663de9SDag-Erling Smørgrav 	/* if more than half the tcp handlers are in use, use a shorter
1185b5663de9SDag-Erling Smørgrav 	 * timeout for this TCP connection, we need to make space for
1186b5663de9SDag-Erling Smørgrav 	 * other connections to be able to get attention */
11874c75e3aaSDag-Erling Smørgrav 	/* If > 50% TCP handler structures in use, set timeout to 1/100th
11884c75e3aaSDag-Erling Smørgrav 	 * 	configured value.
11894c75e3aaSDag-Erling Smørgrav 	 * If > 65%TCP handler structures in use, set to 1/500th configured
11904c75e3aaSDag-Erling Smørgrav 	 * 	value.
11914c75e3aaSDag-Erling Smørgrav 	 * If > 80% TCP handler structures in use, set to 0.
11924c75e3aaSDag-Erling Smørgrav 	 *
11934c75e3aaSDag-Erling Smørgrav 	 * If the timeout to use falls below 200 milliseconds, an actual
11944c75e3aaSDag-Erling Smørgrav 	 * timeout of 200ms is used.
11954c75e3aaSDag-Erling Smørgrav 	 */
11964c75e3aaSDag-Erling Smørgrav 	handler_usage = (cur * 100) / max;
11974c75e3aaSDag-Erling Smørgrav 	if(handler_usage > 50 && handler_usage <= 65)
11984c75e3aaSDag-Erling Smørgrav 		c->tcp_timeout_msec /= 100;
11994c75e3aaSDag-Erling Smørgrav 	else if (handler_usage > 65 && handler_usage <= 80)
12004c75e3aaSDag-Erling Smørgrav 		c->tcp_timeout_msec /= 500;
12014c75e3aaSDag-Erling Smørgrav 	else if (handler_usage > 80)
12024c75e3aaSDag-Erling Smørgrav 		c->tcp_timeout_msec = 0;
1203f44e67d1SCy Schubert 	comm_point_start_listening(c, fd, adjusted_tcp_timeout(c));
1204b7579f77SDag-Erling Smørgrav }
1205b7579f77SDag-Erling Smørgrav 
1206b7579f77SDag-Erling Smørgrav void comm_base_handle_slow_accept(int ATTR_UNUSED(fd),
1207b7579f77SDag-Erling Smørgrav 	short ATTR_UNUSED(event), void* arg)
1208b7579f77SDag-Erling Smørgrav {
1209b7579f77SDag-Erling Smørgrav 	struct comm_base* b = (struct comm_base*)arg;
1210b7579f77SDag-Erling Smørgrav 	/* timeout for the slow accept, re-enable accepts again */
1211b7579f77SDag-Erling Smørgrav 	if(b->start_accept) {
1212b7579f77SDag-Erling Smørgrav 		verbose(VERB_ALGO, "wait is over, slow accept disabled");
1213b7579f77SDag-Erling Smørgrav 		fptr_ok(fptr_whitelist_start_accept(b->start_accept));
1214b7579f77SDag-Erling Smørgrav 		(*b->start_accept)(b->cb_arg);
1215b7579f77SDag-Erling Smørgrav 		b->eb->slow_accept_enabled = 0;
1216b7579f77SDag-Erling Smørgrav 	}
1217b7579f77SDag-Erling Smørgrav }
1218b7579f77SDag-Erling Smørgrav 
1219b7579f77SDag-Erling Smørgrav int comm_point_perform_accept(struct comm_point* c,
1220b7579f77SDag-Erling Smørgrav 	struct sockaddr_storage* addr, socklen_t* addrlen)
1221b7579f77SDag-Erling Smørgrav {
1222b7579f77SDag-Erling Smørgrav 	int new_fd;
1223b7579f77SDag-Erling Smørgrav 	*addrlen = (socklen_t)sizeof(*addr);
12243bd4df0aSDag-Erling Smørgrav #ifndef HAVE_ACCEPT4
1225b7579f77SDag-Erling Smørgrav 	new_fd = accept(c->fd, (struct sockaddr*)addr, addrlen);
12263bd4df0aSDag-Erling Smørgrav #else
12273bd4df0aSDag-Erling Smørgrav 	/* SOCK_NONBLOCK saves extra calls to fcntl for the same result */
12283bd4df0aSDag-Erling Smørgrav 	new_fd = accept4(c->fd, (struct sockaddr*)addr, addrlen, SOCK_NONBLOCK);
12293bd4df0aSDag-Erling Smørgrav #endif
1230b7579f77SDag-Erling Smørgrav 	if(new_fd == -1) {
1231b7579f77SDag-Erling Smørgrav #ifndef USE_WINSOCK
1232b7579f77SDag-Erling Smørgrav 		/* EINTR is signal interrupt. others are closed connection. */
1233b7579f77SDag-Erling Smørgrav 		if(	errno == EINTR || errno == EAGAIN
1234b7579f77SDag-Erling Smørgrav #ifdef EWOULDBLOCK
1235b7579f77SDag-Erling Smørgrav 			|| errno == EWOULDBLOCK
1236b7579f77SDag-Erling Smørgrav #endif
1237b7579f77SDag-Erling Smørgrav #ifdef ECONNABORTED
1238b7579f77SDag-Erling Smørgrav 			|| errno == ECONNABORTED
1239b7579f77SDag-Erling Smørgrav #endif
1240b7579f77SDag-Erling Smørgrav #ifdef EPROTO
1241b7579f77SDag-Erling Smørgrav 			|| errno == EPROTO
1242b7579f77SDag-Erling Smørgrav #endif /* EPROTO */
1243b7579f77SDag-Erling Smørgrav 			)
1244b7579f77SDag-Erling Smørgrav 			return -1;
1245b7579f77SDag-Erling Smørgrav #if defined(ENFILE) && defined(EMFILE)
1246b7579f77SDag-Erling Smørgrav 		if(errno == ENFILE || errno == EMFILE) {
1247b7579f77SDag-Erling Smørgrav 			/* out of file descriptors, likely outside of our
1248b7579f77SDag-Erling Smørgrav 			 * control. stop accept() calls for some time */
1249b7579f77SDag-Erling Smørgrav 			if(c->ev->base->stop_accept) {
1250b7579f77SDag-Erling Smørgrav 				struct comm_base* b = c->ev->base;
1251b7579f77SDag-Erling Smørgrav 				struct timeval tv;
1252b7579f77SDag-Erling Smørgrav 				verbose(VERB_ALGO, "out of file descriptors: "
1253b7579f77SDag-Erling Smørgrav 					"slow accept");
1254865f46b2SCy Schubert 				ub_comm_base_now(b);
1255865f46b2SCy Schubert 				if(b->eb->last_slow_log+SLOW_LOG_TIME <=
1256865f46b2SCy Schubert 					b->eb->secs) {
1257865f46b2SCy Schubert 					b->eb->last_slow_log = b->eb->secs;
1258865f46b2SCy Schubert 					verbose(VERB_OPS, "accept failed, "
1259865f46b2SCy Schubert 						"slow down accept for %d "
1260865f46b2SCy Schubert 						"msec: %s",
1261865f46b2SCy Schubert 						NETEVENT_SLOW_ACCEPT_TIME,
1262865f46b2SCy Schubert 						sock_strerror(errno));
1263865f46b2SCy Schubert 				}
1264b7579f77SDag-Erling Smørgrav 				b->eb->slow_accept_enabled = 1;
1265b7579f77SDag-Erling Smørgrav 				fptr_ok(fptr_whitelist_stop_accept(
1266b7579f77SDag-Erling Smørgrav 					b->stop_accept));
1267b7579f77SDag-Erling Smørgrav 				(*b->stop_accept)(b->cb_arg);
1268b7579f77SDag-Erling Smørgrav 				/* set timeout, no mallocs */
1269b7579f77SDag-Erling Smørgrav 				tv.tv_sec = NETEVENT_SLOW_ACCEPT_TIME/1000;
1270b5663de9SDag-Erling Smørgrav 				tv.tv_usec = (NETEVENT_SLOW_ACCEPT_TIME%1000)*1000;
1271e2d15004SDag-Erling Smørgrav 				b->eb->slow_accept = ub_event_new(b->eb->base,
1272e2d15004SDag-Erling Smørgrav 					-1, UB_EV_TIMEOUT,
1273b7579f77SDag-Erling Smørgrav 					comm_base_handle_slow_accept, b);
1274e2d15004SDag-Erling Smørgrav 				if(b->eb->slow_accept == NULL) {
1275b7579f77SDag-Erling Smørgrav 					/* we do not want to log here, because
1276b7579f77SDag-Erling Smørgrav 					 * that would spam the logfiles.
1277b7579f77SDag-Erling Smørgrav 					 * error: "event_base_set failed." */
1278b7579f77SDag-Erling Smørgrav 				}
1279e2d15004SDag-Erling Smørgrav 				else if(ub_event_add(b->eb->slow_accept, &tv)
1280e2d15004SDag-Erling Smørgrav 					!= 0) {
1281b7579f77SDag-Erling Smørgrav 					/* we do not want to log here,
1282b7579f77SDag-Erling Smørgrav 					 * error: "event_add failed." */
1283b7579f77SDag-Erling Smørgrav 				}
1284865f46b2SCy Schubert 			} else {
1285865f46b2SCy Schubert 				log_err("accept, with no slow down, "
1286865f46b2SCy Schubert 					"failed: %s", sock_strerror(errno));
1287b7579f77SDag-Erling Smørgrav 			}
1288b7579f77SDag-Erling Smørgrav 			return -1;
1289b7579f77SDag-Erling Smørgrav 		}
1290b7579f77SDag-Erling Smørgrav #endif
1291b7579f77SDag-Erling Smørgrav #else /* USE_WINSOCK */
1292b7579f77SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAEINPROGRESS ||
1293b7579f77SDag-Erling Smørgrav 			WSAGetLastError() == WSAECONNRESET)
1294b7579f77SDag-Erling Smørgrav 			return -1;
1295b7579f77SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAEWOULDBLOCK) {
1296e2d15004SDag-Erling Smørgrav 			ub_winsock_tcp_wouldblock(c->ev->ev, UB_EV_READ);
1297b7579f77SDag-Erling Smørgrav 			return -1;
1298b7579f77SDag-Erling Smørgrav 		}
1299b7579f77SDag-Erling Smørgrav #endif
1300c0caa2e2SCy Schubert 		log_err_addr("accept failed", sock_strerror(errno), addr,
1301c0caa2e2SCy Schubert 			*addrlen);
1302b7579f77SDag-Erling Smørgrav 		return -1;
1303b7579f77SDag-Erling Smørgrav 	}
13044c75e3aaSDag-Erling Smørgrav 	if(c->tcp_conn_limit && c->type == comm_tcp_accept) {
13054c75e3aaSDag-Erling Smørgrav 		c->tcl_addr = tcl_addr_lookup(c->tcp_conn_limit, addr, *addrlen);
13064c75e3aaSDag-Erling Smørgrav 		if(!tcl_new_connection(c->tcl_addr)) {
13074c75e3aaSDag-Erling Smørgrav 			if(verbosity >= 3)
13084c75e3aaSDag-Erling Smørgrav 				log_err_addr("accept rejected",
13094c75e3aaSDag-Erling Smørgrav 				"connection limit exceeded", addr, *addrlen);
13104c75e3aaSDag-Erling Smørgrav 			close(new_fd);
13114c75e3aaSDag-Erling Smørgrav 			return -1;
13124c75e3aaSDag-Erling Smørgrav 		}
13134c75e3aaSDag-Erling Smørgrav 	}
13143bd4df0aSDag-Erling Smørgrav #ifndef HAVE_ACCEPT4
1315b7579f77SDag-Erling Smørgrav 	fd_set_nonblock(new_fd);
13163bd4df0aSDag-Erling Smørgrav #endif
1317b7579f77SDag-Erling Smørgrav 	return new_fd;
1318b7579f77SDag-Erling Smørgrav }
1319b7579f77SDag-Erling Smørgrav 
1320b7579f77SDag-Erling Smørgrav #ifdef USE_WINSOCK
1321b7579f77SDag-Erling Smørgrav static long win_bio_cb(BIO *b, int oper, const char* ATTR_UNUSED(argp),
132224e36522SCy Schubert #ifdef HAVE_BIO_SET_CALLBACK_EX
132324e36522SCy Schubert 	size_t ATTR_UNUSED(len),
132424e36522SCy Schubert #endif
132524e36522SCy Schubert         int ATTR_UNUSED(argi), long argl,
132624e36522SCy Schubert #ifndef HAVE_BIO_SET_CALLBACK_EX
132724e36522SCy Schubert 	long retvalue
132824e36522SCy Schubert #else
132924e36522SCy Schubert 	int retvalue, size_t* ATTR_UNUSED(processed)
133024e36522SCy Schubert #endif
133124e36522SCy Schubert 	)
1332b7579f77SDag-Erling Smørgrav {
13333bd4df0aSDag-Erling Smørgrav 	int wsa_err = WSAGetLastError(); /* store errcode before it is gone */
1334b7579f77SDag-Erling Smørgrav 	verbose(VERB_ALGO, "bio_cb %d, %s %s %s", oper,
1335b7579f77SDag-Erling Smørgrav 		(oper&BIO_CB_RETURN)?"return":"before",
1336b7579f77SDag-Erling Smørgrav 		(oper&BIO_CB_READ)?"read":((oper&BIO_CB_WRITE)?"write":"other"),
13373bd4df0aSDag-Erling Smørgrav 		wsa_err==WSAEWOULDBLOCK?"wsawb":"");
1338b7579f77SDag-Erling Smørgrav 	/* on windows, check if previous operation caused EWOULDBLOCK */
1339b7579f77SDag-Erling Smørgrav 	if( (oper == (BIO_CB_READ|BIO_CB_RETURN) && argl == 0) ||
1340b7579f77SDag-Erling Smørgrav 		(oper == (BIO_CB_GETS|BIO_CB_RETURN) && argl == 0)) {
13413bd4df0aSDag-Erling Smørgrav 		if(wsa_err == WSAEWOULDBLOCK)
1342e2d15004SDag-Erling Smørgrav 			ub_winsock_tcp_wouldblock((struct ub_event*)
1343e2d15004SDag-Erling Smørgrav 				BIO_get_callback_arg(b), UB_EV_READ);
1344b7579f77SDag-Erling Smørgrav 	}
1345b7579f77SDag-Erling Smørgrav 	if( (oper == (BIO_CB_WRITE|BIO_CB_RETURN) && argl == 0) ||
1346b7579f77SDag-Erling Smørgrav 		(oper == (BIO_CB_PUTS|BIO_CB_RETURN) && argl == 0)) {
13473bd4df0aSDag-Erling Smørgrav 		if(wsa_err == WSAEWOULDBLOCK)
1348e2d15004SDag-Erling Smørgrav 			ub_winsock_tcp_wouldblock((struct ub_event*)
1349e2d15004SDag-Erling Smørgrav 				BIO_get_callback_arg(b), UB_EV_WRITE);
1350b7579f77SDag-Erling Smørgrav 	}
1351b7579f77SDag-Erling Smørgrav 	/* return original return value */
1352b7579f77SDag-Erling Smørgrav 	return retvalue;
1353b7579f77SDag-Erling Smørgrav }
1354b7579f77SDag-Erling Smørgrav 
1355b7579f77SDag-Erling Smørgrav /** set win bio callbacks for nonblocking operations */
1356b7579f77SDag-Erling Smørgrav void
1357b7579f77SDag-Erling Smørgrav comm_point_tcp_win_bio_cb(struct comm_point* c, void* thessl)
1358b7579f77SDag-Erling Smørgrav {
1359b7579f77SDag-Erling Smørgrav 	SSL* ssl = (SSL*)thessl;
1360b7579f77SDag-Erling Smørgrav 	/* set them both just in case, but usually they are the same BIO */
136124e36522SCy Schubert #ifdef HAVE_BIO_SET_CALLBACK_EX
136224e36522SCy Schubert 	BIO_set_callback_ex(SSL_get_rbio(ssl), &win_bio_cb);
136324e36522SCy Schubert #else
1364b7579f77SDag-Erling Smørgrav 	BIO_set_callback(SSL_get_rbio(ssl), &win_bio_cb);
136524e36522SCy Schubert #endif
1366e2d15004SDag-Erling Smørgrav 	BIO_set_callback_arg(SSL_get_rbio(ssl), (char*)c->ev->ev);
136724e36522SCy Schubert #ifdef HAVE_BIO_SET_CALLBACK_EX
136824e36522SCy Schubert 	BIO_set_callback_ex(SSL_get_wbio(ssl), &win_bio_cb);
136924e36522SCy Schubert #else
1370b7579f77SDag-Erling Smørgrav 	BIO_set_callback(SSL_get_wbio(ssl), &win_bio_cb);
137124e36522SCy Schubert #endif
1372e2d15004SDag-Erling Smørgrav 	BIO_set_callback_arg(SSL_get_wbio(ssl), (char*)c->ev->ev);
1373b7579f77SDag-Erling Smørgrav }
1374b7579f77SDag-Erling Smørgrav #endif
1375b7579f77SDag-Erling Smørgrav 
1376c0caa2e2SCy Schubert #ifdef HAVE_NGHTTP2
1377c0caa2e2SCy Schubert /** Create http2 session server.  Per connection, after TCP accepted.*/
1378c0caa2e2SCy Schubert static int http2_session_server_create(struct http2_session* h2_session)
1379c0caa2e2SCy Schubert {
1380c0caa2e2SCy Schubert 	log_assert(h2_session->callbacks);
1381c0caa2e2SCy Schubert 	h2_session->is_drop = 0;
1382c0caa2e2SCy Schubert 	if(nghttp2_session_server_new(&h2_session->session,
1383c0caa2e2SCy Schubert 			h2_session->callbacks,
1384c0caa2e2SCy Schubert 		h2_session) == NGHTTP2_ERR_NOMEM) {
1385c0caa2e2SCy Schubert 		log_err("failed to create nghttp2 session server");
1386c0caa2e2SCy Schubert 		return 0;
1387c0caa2e2SCy Schubert 	}
1388c0caa2e2SCy Schubert 
1389c0caa2e2SCy Schubert 	return 1;
1390c0caa2e2SCy Schubert }
1391c0caa2e2SCy Schubert 
1392c0caa2e2SCy Schubert /** Submit http2 setting to session. Once per session. */
1393c0caa2e2SCy Schubert static int http2_submit_settings(struct http2_session* h2_session)
1394c0caa2e2SCy Schubert {
1395c0caa2e2SCy Schubert 	int ret;
1396c0caa2e2SCy Schubert 	nghttp2_settings_entry settings[1] = {
1397c0caa2e2SCy Schubert 		{NGHTTP2_SETTINGS_MAX_CONCURRENT_STREAMS,
1398c0caa2e2SCy Schubert 		 h2_session->c->http2_max_streams}};
1399c0caa2e2SCy Schubert 
1400c0caa2e2SCy Schubert 	ret = nghttp2_submit_settings(h2_session->session, NGHTTP2_FLAG_NONE,
1401c0caa2e2SCy Schubert 		settings, 1);
1402c0caa2e2SCy Schubert 	if(ret) {
1403c0caa2e2SCy Schubert 		verbose(VERB_QUERY, "http2: submit_settings failed, "
1404c0caa2e2SCy Schubert 			"error: %s", nghttp2_strerror(ret));
1405c0caa2e2SCy Schubert 		return 0;
1406c0caa2e2SCy Schubert 	}
1407c0caa2e2SCy Schubert 	return 1;
1408c0caa2e2SCy Schubert }
1409c0caa2e2SCy Schubert #endif /* HAVE_NGHTTP2 */
1410c0caa2e2SCy Schubert 
1411c0caa2e2SCy Schubert 
1412b7579f77SDag-Erling Smørgrav void
1413b7579f77SDag-Erling Smørgrav comm_point_tcp_accept_callback(int fd, short event, void* arg)
1414b7579f77SDag-Erling Smørgrav {
1415b7579f77SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)arg, *c_hdl;
1416b7579f77SDag-Erling Smørgrav 	int new_fd;
1417b7579f77SDag-Erling Smørgrav 	log_assert(c->type == comm_tcp_accept);
1418e2d15004SDag-Erling Smørgrav 	if(!(event & UB_EV_READ)) {
1419b7579f77SDag-Erling Smørgrav 		log_info("ignoring tcp accept event %d", (int)event);
1420b7579f77SDag-Erling Smørgrav 		return;
1421b7579f77SDag-Erling Smørgrav 	}
1422e2d15004SDag-Erling Smørgrav 	ub_comm_base_now(c->ev->base);
1423b7579f77SDag-Erling Smørgrav 	/* find free tcp handler. */
1424b7579f77SDag-Erling Smørgrav 	if(!c->tcp_free) {
1425b7579f77SDag-Erling Smørgrav 		log_warn("accepted too many tcp, connections full");
1426b7579f77SDag-Erling Smørgrav 		return;
1427b7579f77SDag-Erling Smørgrav 	}
1428b7579f77SDag-Erling Smørgrav 	/* accept incoming connection. */
1429b7579f77SDag-Erling Smørgrav 	c_hdl = c->tcp_free;
1430e86b9096SDag-Erling Smørgrav 	/* clear leftover flags from previous use, and then set the
1431e86b9096SDag-Erling Smørgrav 	 * correct event base for the event structure for libevent */
1432e86b9096SDag-Erling Smørgrav 	ub_event_free(c_hdl->ev->ev);
143324e36522SCy Schubert 	c_hdl->ev->ev = NULL;
1434369c6923SCy Schubert 	if((c_hdl->type == comm_tcp && c_hdl->tcp_req_info) ||
1435369c6923SCy Schubert 		c_hdl->type == comm_local || c_hdl->type == comm_raw)
1436369c6923SCy Schubert 		c_hdl->tcp_do_toggle_rw = 0;
1437369c6923SCy Schubert 	else	c_hdl->tcp_do_toggle_rw = 1;
1438c0caa2e2SCy Schubert 
1439c0caa2e2SCy Schubert 	if(c_hdl->type == comm_http) {
1440c0caa2e2SCy Schubert #ifdef HAVE_NGHTTP2
1441c0caa2e2SCy Schubert 		if(!c_hdl->h2_session ||
1442c0caa2e2SCy Schubert 			!http2_session_server_create(c_hdl->h2_session)) {
1443c0caa2e2SCy Schubert 			log_warn("failed to create nghttp2");
1444c0caa2e2SCy Schubert 			return;
1445c0caa2e2SCy Schubert 		}
1446c0caa2e2SCy Schubert 		if(!c_hdl->h2_session ||
1447c0caa2e2SCy Schubert 			!http2_submit_settings(c_hdl->h2_session)) {
1448c0caa2e2SCy Schubert 			log_warn("failed to submit http2 settings");
1449c0caa2e2SCy Schubert 			return;
1450c0caa2e2SCy Schubert 		}
1451369c6923SCy Schubert 		if(!c->ssl) {
1452369c6923SCy Schubert 			c_hdl->tcp_do_toggle_rw = 0;
1453369c6923SCy Schubert 			c_hdl->use_h2 = 1;
1454369c6923SCy Schubert 		}
1455c0caa2e2SCy Schubert #endif
1456c0caa2e2SCy Schubert 		c_hdl->ev->ev = ub_event_new(c_hdl->ev->base->eb->base, -1,
1457c0caa2e2SCy Schubert 			UB_EV_PERSIST | UB_EV_READ | UB_EV_TIMEOUT,
1458c0caa2e2SCy Schubert 			comm_point_http_handle_callback, c_hdl);
1459c0caa2e2SCy Schubert 	} else {
1460c0caa2e2SCy Schubert 		c_hdl->ev->ev = ub_event_new(c_hdl->ev->base->eb->base, -1,
1461c0caa2e2SCy Schubert 			UB_EV_PERSIST | UB_EV_READ | UB_EV_TIMEOUT,
1462c0caa2e2SCy Schubert 			comm_point_tcp_handle_callback, c_hdl);
1463c0caa2e2SCy Schubert 	}
1464e86b9096SDag-Erling Smørgrav 	if(!c_hdl->ev->ev) {
1465e86b9096SDag-Erling Smørgrav 		log_warn("could not ub_event_new, dropped tcp");
1466e86b9096SDag-Erling Smørgrav 		return;
1467e86b9096SDag-Erling Smørgrav 	}
1468b7579f77SDag-Erling Smørgrav 	log_assert(fd != -1);
1469b5663de9SDag-Erling Smørgrav 	(void)fd;
1470865f46b2SCy Schubert 	new_fd = comm_point_perform_accept(c, &c_hdl->repinfo.remote_addr,
1471865f46b2SCy Schubert 		&c_hdl->repinfo.remote_addrlen);
1472b7579f77SDag-Erling Smørgrav 	if(new_fd == -1)
1473b7579f77SDag-Erling Smørgrav 		return;
1474865f46b2SCy Schubert 	/* Copy remote_address to client_address.
1475865f46b2SCy Schubert 	 * Simplest way/time for streams to do that. */
1476865f46b2SCy Schubert 	c_hdl->repinfo.client_addrlen = c_hdl->repinfo.remote_addrlen;
1477865f46b2SCy Schubert 	memmove(&c_hdl->repinfo.client_addr,
1478865f46b2SCy Schubert 		&c_hdl->repinfo.remote_addr,
1479865f46b2SCy Schubert 		c_hdl->repinfo.remote_addrlen);
1480b7579f77SDag-Erling Smørgrav 	if(c->ssl) {
1481b7579f77SDag-Erling Smørgrav 		c_hdl->ssl = incoming_ssl_fd(c->ssl, new_fd);
1482b7579f77SDag-Erling Smørgrav 		if(!c_hdl->ssl) {
1483b7579f77SDag-Erling Smørgrav 			c_hdl->fd = new_fd;
1484b7579f77SDag-Erling Smørgrav 			comm_point_close(c_hdl);
1485b7579f77SDag-Erling Smørgrav 			return;
1486b7579f77SDag-Erling Smørgrav 		}
1487b7579f77SDag-Erling Smørgrav 		c_hdl->ssl_shake_state = comm_ssl_shake_read;
1488b7579f77SDag-Erling Smørgrav #ifdef USE_WINSOCK
1489b7579f77SDag-Erling Smørgrav 		comm_point_tcp_win_bio_cb(c_hdl, c_hdl->ssl);
1490b7579f77SDag-Erling Smørgrav #endif
1491b7579f77SDag-Erling Smørgrav 	}
1492b7579f77SDag-Erling Smørgrav 
1493b7579f77SDag-Erling Smørgrav 	/* grab the tcp handler buffers */
149409a3aaf3SDag-Erling Smørgrav 	c->cur_tcp_count++;
1495b7579f77SDag-Erling Smørgrav 	c->tcp_free = c_hdl->tcp_free;
149624e36522SCy Schubert 	c_hdl->tcp_free = NULL;
1497b7579f77SDag-Erling Smørgrav 	if(!c->tcp_free) {
1498b7579f77SDag-Erling Smørgrav 		/* stop accepting incoming queries for now. */
1499b7579f77SDag-Erling Smørgrav 		comm_point_stop_listening(c);
1500b7579f77SDag-Erling Smørgrav 	}
1501b5663de9SDag-Erling Smørgrav 	setup_tcp_handler(c_hdl, new_fd, c->cur_tcp_count, c->max_tcp_count);
1502b7579f77SDag-Erling Smørgrav }
1503b7579f77SDag-Erling Smørgrav 
1504b7579f77SDag-Erling Smørgrav /** Make tcp handler free for next assignment */
1505b7579f77SDag-Erling Smørgrav static void
1506b7579f77SDag-Erling Smørgrav reclaim_tcp_handler(struct comm_point* c)
1507b7579f77SDag-Erling Smørgrav {
1508b7579f77SDag-Erling Smørgrav 	log_assert(c->type == comm_tcp);
1509b7579f77SDag-Erling Smørgrav 	if(c->ssl) {
15108ed2b524SDag-Erling Smørgrav #ifdef HAVE_SSL
1511b7579f77SDag-Erling Smørgrav 		SSL_shutdown(c->ssl);
1512b7579f77SDag-Erling Smørgrav 		SSL_free(c->ssl);
1513b7579f77SDag-Erling Smørgrav 		c->ssl = NULL;
15148ed2b524SDag-Erling Smørgrav #endif
1515b7579f77SDag-Erling Smørgrav 	}
1516b7579f77SDag-Erling Smørgrav 	comm_point_close(c);
1517b7579f77SDag-Erling Smørgrav 	if(c->tcp_parent) {
151824e36522SCy Schubert 		if(c != c->tcp_parent->tcp_free) {
151909a3aaf3SDag-Erling Smørgrav 			c->tcp_parent->cur_tcp_count--;
1520b7579f77SDag-Erling Smørgrav 			c->tcp_free = c->tcp_parent->tcp_free;
1521b7579f77SDag-Erling Smørgrav 			c->tcp_parent->tcp_free = c;
152224e36522SCy Schubert 		}
1523b7579f77SDag-Erling Smørgrav 		if(!c->tcp_free) {
1524b7579f77SDag-Erling Smørgrav 			/* re-enable listening on accept socket */
1525b7579f77SDag-Erling Smørgrav 			comm_point_start_listening(c->tcp_parent, -1, -1);
1526b7579f77SDag-Erling Smørgrav 		}
1527b7579f77SDag-Erling Smørgrav 	}
1528369c6923SCy Schubert 	c->tcp_more_read_again = NULL;
1529369c6923SCy Schubert 	c->tcp_more_write_again = NULL;
15309cf5bc93SCy Schubert 	c->tcp_byte_count = 0;
1531865f46b2SCy Schubert 	c->pp2_header_state = pp2_header_none;
15329cf5bc93SCy Schubert 	sldns_buffer_clear(c->buffer);
1533b7579f77SDag-Erling Smørgrav }
1534b7579f77SDag-Erling Smørgrav 
1535b7579f77SDag-Erling Smørgrav /** do the callback when writing is done */
1536b7579f77SDag-Erling Smørgrav static void
1537b7579f77SDag-Erling Smørgrav tcp_callback_writer(struct comm_point* c)
1538b7579f77SDag-Erling Smørgrav {
1539b7579f77SDag-Erling Smørgrav 	log_assert(c->type == comm_tcp);
1540369c6923SCy Schubert 	if(!c->tcp_write_and_read) {
154117d15b25SDag-Erling Smørgrav 		sldns_buffer_clear(c->buffer);
1542369c6923SCy Schubert 		c->tcp_byte_count = 0;
1543369c6923SCy Schubert 	}
1544b7579f77SDag-Erling Smørgrav 	if(c->tcp_do_toggle_rw)
1545b7579f77SDag-Erling Smørgrav 		c->tcp_is_reading = 1;
1546b7579f77SDag-Erling Smørgrav 	/* switch from listening(write) to listening(read) */
1547e86b9096SDag-Erling Smørgrav 	if(c->tcp_req_info) {
1548e86b9096SDag-Erling Smørgrav 		tcp_req_info_handle_writedone(c->tcp_req_info);
1549e86b9096SDag-Erling Smørgrav 	} else {
1550b7579f77SDag-Erling Smørgrav 		comm_point_stop_listening(c);
1551369c6923SCy Schubert 		if(c->tcp_write_and_read) {
1552369c6923SCy Schubert 			fptr_ok(fptr_whitelist_comm_point(c->callback));
1553369c6923SCy Schubert 			if( (*c->callback)(c, c->cb_arg, NETEVENT_PKT_WRITTEN,
1554369c6923SCy Schubert 				&c->repinfo) ) {
1555369c6923SCy Schubert 				comm_point_start_listening(c, -1,
1556f44e67d1SCy Schubert 					adjusted_tcp_timeout(c));
1557369c6923SCy Schubert 			}
1558369c6923SCy Schubert 		} else {
1559f44e67d1SCy Schubert 			comm_point_start_listening(c, -1,
1560f44e67d1SCy Schubert 					adjusted_tcp_timeout(c));
1561b7579f77SDag-Erling Smørgrav 		}
1562e86b9096SDag-Erling Smørgrav 	}
1563369c6923SCy Schubert }
1564b7579f77SDag-Erling Smørgrav 
1565b7579f77SDag-Erling Smørgrav /** do the callback when reading is done */
1566b7579f77SDag-Erling Smørgrav static void
1567b7579f77SDag-Erling Smørgrav tcp_callback_reader(struct comm_point* c)
1568b7579f77SDag-Erling Smørgrav {
1569b7579f77SDag-Erling Smørgrav 	log_assert(c->type == comm_tcp || c->type == comm_local);
157017d15b25SDag-Erling Smørgrav 	sldns_buffer_flip(c->buffer);
1571b7579f77SDag-Erling Smørgrav 	if(c->tcp_do_toggle_rw)
1572b7579f77SDag-Erling Smørgrav 		c->tcp_is_reading = 0;
1573b7579f77SDag-Erling Smørgrav 	c->tcp_byte_count = 0;
1574e86b9096SDag-Erling Smørgrav 	if(c->tcp_req_info) {
1575e86b9096SDag-Erling Smørgrav 		tcp_req_info_handle_readdone(c->tcp_req_info);
1576e86b9096SDag-Erling Smørgrav 	} else {
1577b7579f77SDag-Erling Smørgrav 		if(c->type == comm_tcp)
1578b7579f77SDag-Erling Smørgrav 			comm_point_stop_listening(c);
1579b7579f77SDag-Erling Smørgrav 		fptr_ok(fptr_whitelist_comm_point(c->callback));
1580b7579f77SDag-Erling Smørgrav 		if( (*c->callback)(c, c->cb_arg, NETEVENT_NOERROR, &c->repinfo) ) {
1581f44e67d1SCy Schubert 			comm_point_start_listening(c, -1,
1582f44e67d1SCy Schubert 					adjusted_tcp_timeout(c));
1583b7579f77SDag-Erling Smørgrav 		}
1584b7579f77SDag-Erling Smørgrav 	}
1585e86b9096SDag-Erling Smørgrav }
1586b7579f77SDag-Erling Smørgrav 
158757bddd21SDag-Erling Smørgrav #ifdef HAVE_SSL
15880eefd307SCy Schubert /** true if the ssl handshake error has to be squelched from the logs */
158925039b37SCy Schubert int
15900eefd307SCy Schubert squelch_err_ssl_handshake(unsigned long err)
15910eefd307SCy Schubert {
15920eefd307SCy Schubert 	if(verbosity >= VERB_QUERY)
15930eefd307SCy Schubert 		return 0; /* only squelch on low verbosity */
1594a39a5a69SCy Schubert 	if(ERR_GET_LIB(err) == ERR_LIB_SSL &&
1595a39a5a69SCy Schubert 		(ERR_GET_REASON(err) == SSL_R_HTTPS_PROXY_REQUEST ||
1596a39a5a69SCy Schubert 		 ERR_GET_REASON(err) == SSL_R_HTTP_REQUEST ||
1597a39a5a69SCy Schubert 		 ERR_GET_REASON(err) == SSL_R_WRONG_VERSION_NUMBER ||
1598a39a5a69SCy Schubert 		 ERR_GET_REASON(err) == SSL_R_SSLV3_ALERT_BAD_CERTIFICATE
15990eefd307SCy Schubert #ifdef SSL_F_TLS_POST_PROCESS_CLIENT_HELLO
1600a39a5a69SCy Schubert 		 || ERR_GET_REASON(err) == SSL_R_NO_SHARED_CIPHER
16010eefd307SCy Schubert #endif
16020eefd307SCy Schubert #ifdef SSL_F_TLS_EARLY_POST_PROCESS_CLIENT_HELLO
1603a39a5a69SCy Schubert 		 || ERR_GET_REASON(err) == SSL_R_UNKNOWN_PROTOCOL
1604a39a5a69SCy Schubert 		 || ERR_GET_REASON(err) == SSL_R_UNSUPPORTED_PROTOCOL
16050eefd307SCy Schubert #  ifdef SSL_R_VERSION_TOO_LOW
1606a39a5a69SCy Schubert 		 || ERR_GET_REASON(err) == SSL_R_VERSION_TOO_LOW
16070eefd307SCy Schubert #  endif
16080eefd307SCy Schubert #endif
1609a39a5a69SCy Schubert 		))
16100eefd307SCy Schubert 		return 1;
16110eefd307SCy Schubert 	return 0;
16120eefd307SCy Schubert }
16130eefd307SCy Schubert #endif /* HAVE_SSL */
16140eefd307SCy Schubert 
1615b7579f77SDag-Erling Smørgrav /** continue ssl handshake */
16168ed2b524SDag-Erling Smørgrav #ifdef HAVE_SSL
1617b7579f77SDag-Erling Smørgrav static int
1618b7579f77SDag-Erling Smørgrav ssl_handshake(struct comm_point* c)
1619b7579f77SDag-Erling Smørgrav {
1620b7579f77SDag-Erling Smørgrav 	int r;
1621b7579f77SDag-Erling Smørgrav 	if(c->ssl_shake_state == comm_ssl_shake_hs_read) {
1622b7579f77SDag-Erling Smørgrav 		/* read condition satisfied back to writing */
16235469a995SCy Schubert 		comm_point_listen_for_rw(c, 0, 1);
1624b7579f77SDag-Erling Smørgrav 		c->ssl_shake_state = comm_ssl_shake_none;
1625b7579f77SDag-Erling Smørgrav 		return 1;
1626b7579f77SDag-Erling Smørgrav 	}
1627b7579f77SDag-Erling Smørgrav 	if(c->ssl_shake_state == comm_ssl_shake_hs_write) {
1628b7579f77SDag-Erling Smørgrav 		/* write condition satisfied, back to reading */
1629b7579f77SDag-Erling Smørgrav 		comm_point_listen_for_rw(c, 1, 0);
1630b7579f77SDag-Erling Smørgrav 		c->ssl_shake_state = comm_ssl_shake_none;
1631b7579f77SDag-Erling Smørgrav 		return 1;
1632b7579f77SDag-Erling Smørgrav 	}
1633b7579f77SDag-Erling Smørgrav 
1634b7579f77SDag-Erling Smørgrav 	ERR_clear_error();
1635b7579f77SDag-Erling Smørgrav 	r = SSL_do_handshake(c->ssl);
1636b7579f77SDag-Erling Smørgrav 	if(r != 1) {
1637b7579f77SDag-Erling Smørgrav 		int want = SSL_get_error(c->ssl, r);
1638b7579f77SDag-Erling Smørgrav 		if(want == SSL_ERROR_WANT_READ) {
1639b7579f77SDag-Erling Smørgrav 			if(c->ssl_shake_state == comm_ssl_shake_read)
1640b7579f77SDag-Erling Smørgrav 				return 1;
1641b7579f77SDag-Erling Smørgrav 			c->ssl_shake_state = comm_ssl_shake_read;
1642b7579f77SDag-Erling Smørgrav 			comm_point_listen_for_rw(c, 1, 0);
1643b7579f77SDag-Erling Smørgrav 			return 1;
1644b7579f77SDag-Erling Smørgrav 		} else if(want == SSL_ERROR_WANT_WRITE) {
1645b7579f77SDag-Erling Smørgrav 			if(c->ssl_shake_state == comm_ssl_shake_write)
1646b7579f77SDag-Erling Smørgrav 				return 1;
1647b7579f77SDag-Erling Smørgrav 			c->ssl_shake_state = comm_ssl_shake_write;
1648b7579f77SDag-Erling Smørgrav 			comm_point_listen_for_rw(c, 0, 1);
1649b7579f77SDag-Erling Smørgrav 			return 1;
1650b7579f77SDag-Erling Smørgrav 		} else if(r == 0) {
1651b7579f77SDag-Erling Smørgrav 			return 0; /* closed */
1652b7579f77SDag-Erling Smørgrav 		} else if(want == SSL_ERROR_SYSCALL) {
1653b7579f77SDag-Erling Smørgrav 			/* SYSCALL and errno==0 means closed uncleanly */
1654091e9e46SCy Schubert #ifdef EPIPE
1655091e9e46SCy Schubert 			if(errno == EPIPE && verbosity < 2)
1656091e9e46SCy Schubert 				return 0; /* silence 'broken pipe' */
1657091e9e46SCy Schubert #endif
1658091e9e46SCy Schubert #ifdef ECONNRESET
1659091e9e46SCy Schubert 			if(errno == ECONNRESET && verbosity < 2)
1660091e9e46SCy Schubert 				return 0; /* silence reset by peer */
1661091e9e46SCy Schubert #endif
1662a39a5a69SCy Schubert 			if(!tcp_connect_errno_needs_log(
1663865f46b2SCy Schubert 				(struct sockaddr*)&c->repinfo.remote_addr,
1664865f46b2SCy Schubert 				c->repinfo.remote_addrlen))
1665a39a5a69SCy Schubert 				return 0; /* silence connect failures that
1666a39a5a69SCy Schubert 				show up because after connect this is the
1667a39a5a69SCy Schubert 				first system call that accesses the socket */
1668b7579f77SDag-Erling Smørgrav 			if(errno != 0)
1669b7579f77SDag-Erling Smørgrav 				log_err("SSL_handshake syscall: %s",
1670b7579f77SDag-Erling Smørgrav 					strerror(errno));
1671b7579f77SDag-Erling Smørgrav 			return 0;
1672b7579f77SDag-Erling Smørgrav 		} else {
16730eefd307SCy Schubert 			unsigned long err = ERR_get_error();
16740eefd307SCy Schubert 			if(!squelch_err_ssl_handshake(err)) {
1675*b7c0c8c1SCy Schubert 				long vr;
1676103ba509SCy Schubert 				log_crypto_err_io_code("ssl handshake failed",
1677103ba509SCy Schubert 					want, err);
1678*b7c0c8c1SCy Schubert 				if((vr=SSL_get_verify_result(c->ssl)) != 0)
1679*b7c0c8c1SCy Schubert 					log_err("ssl handshake cert error: %s",
1680*b7c0c8c1SCy Schubert 						X509_verify_cert_error_string(
1681*b7c0c8c1SCy Schubert 						vr));
1682865f46b2SCy Schubert 				log_addr(VERB_OPS, "ssl handshake failed",
1683865f46b2SCy Schubert 					&c->repinfo.remote_addr,
1684865f46b2SCy Schubert 					c->repinfo.remote_addrlen);
16850eefd307SCy Schubert 			}
1686b7579f77SDag-Erling Smørgrav 			return 0;
1687b7579f77SDag-Erling Smørgrav 		}
1688b7579f77SDag-Erling Smørgrav 	}
1689b7579f77SDag-Erling Smørgrav 	/* this is where peer verification could take place */
169057bddd21SDag-Erling Smørgrav 	if((SSL_get_verify_mode(c->ssl)&SSL_VERIFY_PEER)) {
169157bddd21SDag-Erling Smørgrav 		/* verification */
169257bddd21SDag-Erling Smørgrav 		if(SSL_get_verify_result(c->ssl) == X509_V_OK) {
16935469a995SCy Schubert #ifdef HAVE_SSL_GET1_PEER_CERTIFICATE
16945469a995SCy Schubert 			X509* x = SSL_get1_peer_certificate(c->ssl);
16955469a995SCy Schubert #else
169657bddd21SDag-Erling Smørgrav 			X509* x = SSL_get_peer_certificate(c->ssl);
16975469a995SCy Schubert #endif
169857bddd21SDag-Erling Smørgrav 			if(!x) {
169957bddd21SDag-Erling Smørgrav 				log_addr(VERB_ALGO, "SSL connection failed: "
170057bddd21SDag-Erling Smørgrav 					"no certificate",
1701865f46b2SCy Schubert 					&c->repinfo.remote_addr,
1702865f46b2SCy Schubert 					c->repinfo.remote_addrlen);
170357bddd21SDag-Erling Smørgrav 				return 0;
170457bddd21SDag-Erling Smørgrav 			}
170557bddd21SDag-Erling Smørgrav 			log_cert(VERB_ALGO, "peer certificate", x);
170657bddd21SDag-Erling Smørgrav #ifdef HAVE_SSL_GET0_PEERNAME
170757bddd21SDag-Erling Smørgrav 			if(SSL_get0_peername(c->ssl)) {
170857bddd21SDag-Erling Smørgrav 				char buf[255];
170957bddd21SDag-Erling Smørgrav 				snprintf(buf, sizeof(buf), "SSL connection "
171057bddd21SDag-Erling Smørgrav 					"to %s authenticated",
171157bddd21SDag-Erling Smørgrav 					SSL_get0_peername(c->ssl));
1712865f46b2SCy Schubert 				log_addr(VERB_ALGO, buf, &c->repinfo.remote_addr,
1713865f46b2SCy Schubert 					c->repinfo.remote_addrlen);
171457bddd21SDag-Erling Smørgrav 			} else {
171557bddd21SDag-Erling Smørgrav #endif
171657bddd21SDag-Erling Smørgrav 				log_addr(VERB_ALGO, "SSL connection "
1717865f46b2SCy Schubert 					"authenticated", &c->repinfo.remote_addr,
1718865f46b2SCy Schubert 					c->repinfo.remote_addrlen);
171957bddd21SDag-Erling Smørgrav #ifdef HAVE_SSL_GET0_PEERNAME
172057bddd21SDag-Erling Smørgrav 			}
172157bddd21SDag-Erling Smørgrav #endif
172257bddd21SDag-Erling Smørgrav 			X509_free(x);
172357bddd21SDag-Erling Smørgrav 		} else {
17245469a995SCy Schubert #ifdef HAVE_SSL_GET1_PEER_CERTIFICATE
17255469a995SCy Schubert 			X509* x = SSL_get1_peer_certificate(c->ssl);
17265469a995SCy Schubert #else
172757bddd21SDag-Erling Smørgrav 			X509* x = SSL_get_peer_certificate(c->ssl);
17285469a995SCy Schubert #endif
172957bddd21SDag-Erling Smørgrav 			if(x) {
173057bddd21SDag-Erling Smørgrav 				log_cert(VERB_ALGO, "peer certificate", x);
173157bddd21SDag-Erling Smørgrav 				X509_free(x);
173257bddd21SDag-Erling Smørgrav 			}
173357bddd21SDag-Erling Smørgrav 			log_addr(VERB_ALGO, "SSL connection failed: "
173457bddd21SDag-Erling Smørgrav 				"failed to authenticate",
1735865f46b2SCy Schubert 				&c->repinfo.remote_addr,
1736865f46b2SCy Schubert 				c->repinfo.remote_addrlen);
173757bddd21SDag-Erling Smørgrav 			return 0;
173857bddd21SDag-Erling Smørgrav 		}
173957bddd21SDag-Erling Smørgrav 	} else {
174057bddd21SDag-Erling Smørgrav 		/* unauthenticated, the verify peer flag was not set
174157bddd21SDag-Erling Smørgrav 		 * in c->ssl when the ssl object was created from ssl_ctx */
1742865f46b2SCy Schubert 		log_addr(VERB_ALGO, "SSL connection", &c->repinfo.remote_addr,
1743865f46b2SCy Schubert 			c->repinfo.remote_addrlen);
174457bddd21SDag-Erling Smørgrav 	}
1745b7579f77SDag-Erling Smørgrav 
17465469a995SCy Schubert #ifdef HAVE_SSL_GET0_ALPN_SELECTED
1747c0caa2e2SCy Schubert 	/* check if http2 use is negotiated */
1748c0caa2e2SCy Schubert 	if(c->type == comm_http && c->h2_session) {
1749c0caa2e2SCy Schubert 		const unsigned char *alpn;
1750c0caa2e2SCy Schubert 		unsigned int alpnlen = 0;
1751c0caa2e2SCy Schubert 		SSL_get0_alpn_selected(c->ssl, &alpn, &alpnlen);
1752c0caa2e2SCy Schubert 		if(alpnlen == 2 && memcmp("h2", alpn, 2) == 0) {
1753c0caa2e2SCy Schubert 			/* connection upgraded to HTTP2 */
1754c0caa2e2SCy Schubert 			c->tcp_do_toggle_rw = 0;
1755c0caa2e2SCy Schubert 			c->use_h2 = 1;
1756*b7c0c8c1SCy Schubert 		} else {
1757*b7c0c8c1SCy Schubert 			verbose(VERB_ALGO, "client doesn't support HTTP/2");
1758*b7c0c8c1SCy Schubert 			return 0;
1759c0caa2e2SCy Schubert 		}
1760c0caa2e2SCy Schubert 	}
17615469a995SCy Schubert #endif
1762c0caa2e2SCy Schubert 
1763b7579f77SDag-Erling Smørgrav 	/* setup listen rw correctly */
1764b7579f77SDag-Erling Smørgrav 	if(c->tcp_is_reading) {
1765b7579f77SDag-Erling Smørgrav 		if(c->ssl_shake_state != comm_ssl_shake_read)
1766b7579f77SDag-Erling Smørgrav 			comm_point_listen_for_rw(c, 1, 0);
1767b7579f77SDag-Erling Smørgrav 	} else {
17685469a995SCy Schubert 		comm_point_listen_for_rw(c, 0, 1);
1769b7579f77SDag-Erling Smørgrav 	}
1770b7579f77SDag-Erling Smørgrav 	c->ssl_shake_state = comm_ssl_shake_none;
1771b7579f77SDag-Erling Smørgrav 	return 1;
1772b7579f77SDag-Erling Smørgrav }
17738ed2b524SDag-Erling Smørgrav #endif /* HAVE_SSL */
1774b7579f77SDag-Erling Smørgrav 
#ifdef HAVE_SSL
/**
 * Handle an SSL_read call that did not return data (result <= 0).
 * Shared by every SSL_read call site in ssl_handle_read so that the
 * outcome of a failed read is decided in exactly one place.
 * @param c: comm point on which SSL_read was called.
 * @param r: the value returned by SSL_read, must be <= 0.
 * @return: 0 if the connection has to be closed, 1 if the caller has to
 *	return and wait for the next event. When the peer shut down TLS
 *	cleanly and c->tcp_req_info is set, the result of
 *	tcp_req_info_handle_read_close is returned instead.
 */
static int
ssl_tcp_read_failure(struct comm_point* c, int r)
{
	int want = SSL_get_error(c->ssl, r);
	if(want == SSL_ERROR_ZERO_RETURN) {
		if(c->tcp_req_info)
			return tcp_req_info_handle_read_close(c->tcp_req_info);
		return 0; /* shutdown, closed */
	} else if(want == SSL_ERROR_WANT_READ) {
#ifdef USE_WINSOCK
		ub_winsock_tcp_wouldblock(c->ev->ev, UB_EV_READ);
#endif
		return 1; /* read more later */
	} else if(want == SSL_ERROR_WANT_WRITE) {
		/* the read has to be retried once the socket is writable;
		 * ssl_handle_it routes that write event back to the reader */
		c->ssl_shake_state = comm_ssl_shake_hs_write;
		comm_point_listen_for_rw(c, 0, 1);
		return 1;
	} else if(want == SSL_ERROR_SYSCALL) {
#ifdef ECONNRESET
		if(errno == ECONNRESET && verbosity < 2)
			return 0; /* silence reset by peer */
#endif
		if(errno != 0)
			log_err("SSL_read syscall: %s",
				strerror(errno));
		return 0;
	}
	log_crypto_err_io("could not SSL_read", want);
	return 0;
}
#endif /* HAVE_SSL */

/**
 * ssl read callback on TCP.
 * Performs, in order and resuming where an earlier call stopped:
 * the pending handshake (if any), the PROXYv2 header (if pp2 is enabled
 * and the header is not done yet), the two byte length prefix, and the
 * message itself. Once the buffer has no space remaining,
 * tcp_callback_reader is called.
 * @param c: comm point to read from into c->buffer.
 * @return: 0 on error or when the connection is closed, 1 otherwise
 *	(also when more data has to be awaited). Without HAVE_SSL always 0.
 */
static int
ssl_handle_read(struct comm_point* c)
{
#ifdef HAVE_SSL
	int r;
	if(c->ssl_shake_state != comm_ssl_shake_none) {
		if(!ssl_handshake(c))
			return 0;
		if(c->ssl_shake_state != comm_ssl_shake_none)
			return 1;
	}
	if(c->pp2_enabled && c->pp2_header_state != pp2_header_done) {
		struct pp2_header* header = NULL;
		size_t want_read_size = 0;
		size_t current_read_size = 0;
		if(c->pp2_header_state == pp2_header_none) {
			/* first the fixed size part of the header */
			want_read_size = PP2_HEADER_SIZE;
			if(sldns_buffer_remaining(c->buffer)<want_read_size) {
				log_err_addr("proxy_protocol: not enough "
					"buffer size to read PROXYv2 header", "",
					&c->repinfo.remote_addr,
					c->repinfo.remote_addrlen);
				return 0;
			}
			verbose(VERB_ALGO, "proxy_protocol: reading fixed "
				"part of PROXYv2 header (len %lu)",
				(unsigned long)want_read_size);
			current_read_size = want_read_size;
			if(c->tcp_byte_count < current_read_size) {
				ERR_clear_error();
				r = SSL_read(c->ssl, (void*)sldns_buffer_at(
					c->buffer, c->tcp_byte_count),
					(int)(current_read_size -
					c->tcp_byte_count));
				if(r <= 0)
					return ssl_tcp_read_failure(c, r);
				c->tcp_byte_count += r;
				sldns_buffer_skip(c->buffer, r);
				if(c->tcp_byte_count != current_read_size) return 1;
				c->pp2_header_state = pp2_header_init;
			}
		}
		if(c->pp2_header_state == pp2_header_init) {
			/* fixed part is in the buffer; validate it and read
			 * the variable part whose length it announces */
			int err;
			err = pp2_read_header(
				sldns_buffer_begin(c->buffer),
				sldns_buffer_limit(c->buffer));
			if(err) {
				log_err("proxy_protocol: could not parse "
					"PROXYv2 header (%s)",
					pp_lookup_error(err));
				return 0;
			}
			header = (struct pp2_header*)sldns_buffer_begin(c->buffer);
			want_read_size = ntohs(header->len);
			if(sldns_buffer_limit(c->buffer) <
				PP2_HEADER_SIZE + want_read_size) {
				log_err_addr("proxy_protocol: not enough "
					"buffer size to read PROXYv2 header", "",
					&c->repinfo.remote_addr,
					c->repinfo.remote_addrlen);
				return 0;
			}
			verbose(VERB_ALGO, "proxy_protocol: reading variable "
				"part of PROXYv2 header (len %lu)",
				(unsigned long)want_read_size);
			current_read_size = PP2_HEADER_SIZE + want_read_size;
			if(want_read_size == 0) {
				/* nothing more to read; header is complete */
				c->pp2_header_state = pp2_header_done;
			} else if(c->tcp_byte_count < current_read_size) {
				ERR_clear_error();
				r = SSL_read(c->ssl, (void*)sldns_buffer_at(
					c->buffer, c->tcp_byte_count),
					(int)(current_read_size -
					c->tcp_byte_count));
				if(r <= 0)
					return ssl_tcp_read_failure(c, r);
				c->tcp_byte_count += r;
				sldns_buffer_skip(c->buffer, r);
				if(c->tcp_byte_count != current_read_size) return 1;
				c->pp2_header_state = pp2_header_done;
			}
		}
		/* header is only set by the init step above; reaching this
		 * point without it, or without a done state, is an error */
		if(c->pp2_header_state != pp2_header_done || !header) {
			log_err_addr("proxy_protocol: wrong state for the "
				"PROXYv2 header", "", &c->repinfo.remote_addr,
				c->repinfo.remote_addrlen);
			return 0;
		}
		sldns_buffer_flip(c->buffer);
		if(!consume_pp2_header(c->buffer, &c->repinfo, 1)) {
			log_err_addr("proxy_protocol: could not consume "
				"PROXYv2 header", "", &c->repinfo.remote_addr,
				c->repinfo.remote_addrlen);
			return 0;
		}
		verbose(VERB_ALGO, "proxy_protocol: successful read of "
			"PROXYv2 header");
		/* Clear and reset the buffer to read the following
		 * DNS packet(s). */
		sldns_buffer_clear(c->buffer);
		c->tcp_byte_count = 0;
		return 1;
	}
	if(c->tcp_byte_count < sizeof(uint16_t)) {
		/* read length bytes */
		ERR_clear_error();
		r = SSL_read(c->ssl, (void*)sldns_buffer_at(c->buffer,
			c->tcp_byte_count), (int)(sizeof(uint16_t) -
			c->tcp_byte_count));
		if(r <= 0)
			return ssl_tcp_read_failure(c, r);
		c->tcp_byte_count += r;
		if(c->tcp_byte_count < sizeof(uint16_t))
			return 1;
		if(sldns_buffer_read_u16_at(c->buffer, 0) >
			sldns_buffer_capacity(c->buffer)) {
			verbose(VERB_QUERY, "ssl: dropped larger than buffer");
			return 0;
		}
		/* the length prefix becomes the limit of the buffer */
		sldns_buffer_set_limit(c->buffer,
			sldns_buffer_read_u16_at(c->buffer, 0));
		if(sldns_buffer_limit(c->buffer) < LDNS_HEADER_SIZE) {
			verbose(VERB_QUERY, "ssl: dropped bogus too short.");
			return 0;
		}
		sldns_buffer_skip(c->buffer, (ssize_t)(c->tcp_byte_count-sizeof(uint16_t)));
		verbose(VERB_ALGO, "Reading ssl tcp query of length %d",
			(int)sldns_buffer_limit(c->buffer));
	}
	if(sldns_buffer_remaining(c->buffer) > 0) {
		ERR_clear_error();
		r = SSL_read(c->ssl, (void*)sldns_buffer_current(c->buffer),
			(int)sldns_buffer_remaining(c->buffer));
		if(r <= 0)
			return ssl_tcp_read_failure(c, r);
		sldns_buffer_skip(c->buffer, (ssize_t)r);
	}
	/* remaining is an unsigned count, so zero is the only 'full' value */
	if(sldns_buffer_remaining(c->buffer) == 0) {
		tcp_callback_reader(c);
	}
	return 1;
#else
	(void)c;
	return 0;
#endif /* HAVE_SSL */
}
2027b7579f77SDag-Erling Smørgrav 
#ifdef HAVE_SSL
/**
 * Handle an SSL_write call that did not write data (result <= 0).
 * Shared by both SSL_write phases in ssl_handle_write.
 * @param c: comm point on which SSL_write was called.
 * @param r: the value returned by SSL_write, must be <= 0.
 * @return: 0 if the connection has to be closed, 1 if the caller has to
 *	return and wait for the next event.
 */
static int
ssl_tcp_write_failure(struct comm_point* c, int r)
{
	int want = SSL_get_error(c->ssl, r);
	if(want == SSL_ERROR_ZERO_RETURN) {
		return 0; /* closed */
	} else if(want == SSL_ERROR_WANT_READ) {
		/* the write has to be retried once the socket is readable;
		 * ssl_handle_it routes that read event back to the writer */
		c->ssl_shake_state = comm_ssl_shake_hs_read;
		comm_point_listen_for_rw(c, 1, 0);
		return 1; /* wait for read condition */
	} else if(want == SSL_ERROR_WANT_WRITE) {
#ifdef USE_WINSOCK
		ub_winsock_tcp_wouldblock(c->ev->ev, UB_EV_WRITE);
#endif
		return 1; /* write more later */
	} else if(want == SSL_ERROR_SYSCALL) {
#ifdef EPIPE
		if(errno == EPIPE && verbosity < 2)
			return 0; /* silence 'broken pipe' */
#endif
		if(errno != 0)
			log_err("SSL_write syscall: %s",
				strerror(errno));
		return 0;
	}
	log_crypto_err_io("could not SSL_write", want);
	return 0;
}

/**
 * See if the complete message (length prefix and contents) was written.
 * @param c: comm point that is being written.
 * @return: true if nothing is left to write. In write-and-read mode that
 *	is when the write byte count equals the packet length plus the two
 *	length bytes, otherwise when the buffer has nothing remaining.
 */
static int
ssl_tcp_write_done(struct comm_point* c)
{
	if(c->tcp_write_and_read)
		return c->tcp_write_byte_count == c->tcp_write_pkt_len + 2;
	return sldns_buffer_remaining(c->buffer) == 0;
}
#endif /* HAVE_SSL */

/**
 * ssl write callback on TCP.
 * Performs the pending handshake (if any), then writes the two byte
 * length prefix (combined with the message when that fits in a
 * LDNS_RR_BUF_SIZE stack buffer) and then the rest of the message.
 * Calls tcp_callback_writer once the whole message has been written.
 * The data comes from c->tcp_write_pkt when c->tcp_write_and_read is set
 * and from c->buffer otherwise.
 * @param c: comm point to write.
 * @return: 0 on error or when the connection is closed, 1 otherwise
 *	(also when the write has to continue later). Without HAVE_SSL
 *	always 0.
 */
static int
ssl_handle_write(struct comm_point* c)
{
#ifdef HAVE_SSL
	int r;
	if(c->ssl_shake_state != comm_ssl_shake_none) {
		if(!ssl_handshake(c))
			return 0;
		if(c->ssl_shake_state != comm_ssl_shake_none)
			return 1;
	}
	/* ignore return, if fails we may simply block */
	(void)SSL_set_mode(c->ssl, (long)SSL_MODE_ENABLE_PARTIAL_WRITE);
	if((c->tcp_write_and_read?c->tcp_write_byte_count:c->tcp_byte_count) < sizeof(uint16_t)) {
		/* the length prefix has not been completely sent yet */
		uint16_t len = htons(c->tcp_write_and_read?c->tcp_write_pkt_len:sldns_buffer_limit(c->buffer));
		ERR_clear_error();
		if(c->tcp_write_and_read) {
			if(c->tcp_write_pkt_len + 2 < LDNS_RR_BUF_SIZE) {
				/* combine the tcp length and the query for
				 * write, this emulates writev */
				uint8_t buf[LDNS_RR_BUF_SIZE];
				memmove(buf, &len, sizeof(uint16_t));
				memmove(buf+sizeof(uint16_t),
					c->tcp_write_pkt,
					c->tcp_write_pkt_len);
				r = SSL_write(c->ssl,
					(void*)(buf+c->tcp_write_byte_count),
					(int)(c->tcp_write_pkt_len + 2 -
					c->tcp_write_byte_count));
			} else {
				r = SSL_write(c->ssl,
					(void*)(((uint8_t*)&len)+c->tcp_write_byte_count),
					(int)(sizeof(uint16_t)-c->tcp_write_byte_count));
			}
		} else if(sizeof(uint16_t)+sldns_buffer_remaining(c->buffer) <
			LDNS_RR_BUF_SIZE) {
			/* combine the tcp length and the query for write,
			 * this emulates writev */
			uint8_t buf[LDNS_RR_BUF_SIZE];
			memmove(buf, &len, sizeof(uint16_t));
			memmove(buf+sizeof(uint16_t),
				sldns_buffer_current(c->buffer),
				sldns_buffer_remaining(c->buffer));
			r = SSL_write(c->ssl, (void*)(buf+c->tcp_byte_count),
				(int)(sizeof(uint16_t)+
				sldns_buffer_remaining(c->buffer)
				- c->tcp_byte_count));
		} else {
			r = SSL_write(c->ssl,
				(void*)(((uint8_t*)&len)+c->tcp_byte_count),
				(int)(sizeof(uint16_t)-c->tcp_byte_count));
		}
		if(r <= 0)
			return ssl_tcp_write_failure(c, r);
		if(c->tcp_write_and_read) {
			c->tcp_write_byte_count += r;
			if(c->tcp_write_byte_count < sizeof(uint16_t))
				return 1;
		} else {
			c->tcp_byte_count += r;
			if(c->tcp_byte_count < sizeof(uint16_t))
				return 1;
			/* the byte count includes the two length bytes,
			 * the buffer position does not */
			sldns_buffer_set_position(c->buffer, c->tcp_byte_count -
				sizeof(uint16_t));
		}
		if(ssl_tcp_write_done(c)) {
			tcp_callback_writer(c);
			return 1;
		}
	}
	log_assert(c->tcp_write_and_read || sldns_buffer_remaining(c->buffer) > 0);
	log_assert(!c->tcp_write_and_read || c->tcp_write_byte_count < c->tcp_write_pkt_len + 2);
	ERR_clear_error();
	if(c->tcp_write_and_read) {
		/* the write byte count includes the two length bytes */
		r = SSL_write(c->ssl, (void*)(c->tcp_write_pkt + c->tcp_write_byte_count - 2),
			(int)(c->tcp_write_pkt_len + 2 - c->tcp_write_byte_count));
	} else {
		r = SSL_write(c->ssl, (void*)sldns_buffer_current(c->buffer),
			(int)sldns_buffer_remaining(c->buffer));
	}
	if(r <= 0)
		return ssl_tcp_write_failure(c, r);
	if(c->tcp_write_and_read) {
		c->tcp_write_byte_count += r;
	} else {
		sldns_buffer_skip(c->buffer, (ssize_t)r);
	}

	if(ssl_tcp_write_done(c)) {
		tcp_callback_writer(c);
	}
	return 1;
#else
	(void)c;
	return 0;
#endif /* HAVE_SSL */
}
2174b7579f77SDag-Erling Smørgrav 
2175b7579f77SDag-Erling Smørgrav /** handle ssl tcp connection with dns contents */
2176b7579f77SDag-Erling Smørgrav static int
2177369c6923SCy Schubert ssl_handle_it(struct comm_point* c, int is_write)
2178b7579f77SDag-Erling Smørgrav {
2179369c6923SCy Schubert 	/* handle case where renegotiation wants read during write call
2180369c6923SCy Schubert 	 * or write during read calls */
2181369c6923SCy Schubert 	if(is_write && c->ssl_shake_state == comm_ssl_shake_hs_write)
2182369c6923SCy Schubert 		return ssl_handle_read(c);
2183369c6923SCy Schubert 	else if(!is_write && c->ssl_shake_state == comm_ssl_shake_hs_read)
2184369c6923SCy Schubert 		return ssl_handle_write(c);
2185369c6923SCy Schubert 	/* handle read events for read operation and write events for a
2186369c6923SCy Schubert 	 * write operation */
2187369c6923SCy Schubert 	else if(!is_write)
2188b7579f77SDag-Erling Smørgrav 		return ssl_handle_read(c);
2189b7579f77SDag-Erling Smørgrav 	return ssl_handle_write(c);
2190b7579f77SDag-Erling Smørgrav }
2191b7579f77SDag-Erling Smørgrav 
2192865f46b2SCy Schubert /**
2193865f46b2SCy Schubert  * Handle tcp reading callback.
 * TLS comm points are delegated to ssl_handle_it(). Otherwise the stream
 * is read in steps, each of which may take several calls to complete:
 * an optional PROXYv2 header (when pp2_enabled is set), the two byte
 * length prefix, and then the message itself. tcp_callback_reader() is
 * called once the buffer has no space remaining up to its limit.
2194b7579f77SDag-Erling Smørgrav  * @param fd: file descriptor of socket.
2195b7579f77SDag-Erling Smørgrav  * @param c: comm point to read from into buffer.
2196b7579f77SDag-Erling Smørgrav  * @param short_ok: if true, very short packets are OK (for comm_local).
2197b7579f77SDag-Erling Smørgrav  * @return: 0 on error
 *	1 is returned on progress and also for the retry cases (partial
 *	read, EINTR, EAGAIN, would-block). When recv returns 0 and the comm
 *	point has a tcp_req_info, the result of
 *	tcp_req_info_handle_read_close() is returned instead.
2198b7579f77SDag-Erling Smørgrav  */
2199b7579f77SDag-Erling Smørgrav static int
2200b7579f77SDag-Erling Smørgrav comm_point_tcp_handle_read(int fd, struct comm_point* c, int short_ok)
2201b7579f77SDag-Erling Smørgrav {
2202b7579f77SDag-Erling Smørgrav 	ssize_t r;
	/* set via the recv_error_initial label; enables the extra errno
	 * filtering in the error handling at the end of the function */
2203865f46b2SCy Schubert 	int recv_initial = 0;
2204b7579f77SDag-Erling Smørgrav 	log_assert(c->type == comm_tcp || c->type == comm_local);
	/* TLS connections are read by the ssl handler */
2205b7579f77SDag-Erling Smørgrav 	if(c->ssl)
2206369c6923SCy Schubert 		return ssl_handle_it(c, 0);
	/* a read event while the comm point is neither reading nor in
	 * write-and-read mode is reported as an error */
2207369c6923SCy Schubert 	if(!c->tcp_is_reading && !c->tcp_write_and_read)
2208b7579f77SDag-Erling Smørgrav 		return 0;
2209b7579f77SDag-Erling Smørgrav 
2210b7579f77SDag-Erling Smørgrav 	log_assert(fd != -1);
	/* PROXYv2 header, handled before the length prefix and message.
	 * It is read as a fixed part of PP2_HEADER_SIZE bytes followed by
	 * a variable part whose length is taken from the fixed part. */
2211865f46b2SCy Schubert 	if(c->pp2_enabled && c->pp2_header_state != pp2_header_done) {
2212865f46b2SCy Schubert 		struct pp2_header* header = NULL;
2213865f46b2SCy Schubert 		size_t want_read_size = 0;
2214865f46b2SCy Schubert 		size_t current_read_size = 0;
2215865f46b2SCy Schubert 		if(c->pp2_header_state == pp2_header_none) {
2216865f46b2SCy Schubert 			want_read_size = PP2_HEADER_SIZE;
2217865f46b2SCy Schubert 			if(sldns_buffer_remaining(c->buffer)<want_read_size) {
2218865f46b2SCy Schubert 				log_err_addr("proxy_protocol: not enough "
2219865f46b2SCy Schubert 					"buffer size to read PROXYv2 header", "",
2220865f46b2SCy Schubert 					&c->repinfo.remote_addr,
2221865f46b2SCy Schubert 					c->repinfo.remote_addrlen);
2222865f46b2SCy Schubert 				return 0;
2223865f46b2SCy Schubert 			}
2224865f46b2SCy Schubert 			verbose(VERB_ALGO, "proxy_protocol: reading fixed "
2225865f46b2SCy Schubert 				"part of PROXYv2 header (len %lu)",
2226865f46b2SCy Schubert 				(unsigned long)want_read_size);
2227865f46b2SCy Schubert 			current_read_size = want_read_size;
			/* tcp_byte_count is the number of header bytes
			 * received so far; ask only for the missing part */
2228865f46b2SCy Schubert 			if(c->tcp_byte_count < current_read_size) {
2229865f46b2SCy Schubert 				r = recv(fd, (void*)sldns_buffer_at(c->buffer,
2230865f46b2SCy Schubert 					c->tcp_byte_count),
2231865f46b2SCy Schubert 					current_read_size-c->tcp_byte_count, MSG_DONTWAIT);
				/* recv returned 0 for a nonzero request:
				 * the peer closed the connection */
223264d318eaSCy Schubert 				if(r == 0) {
223364d318eaSCy Schubert 					if(c->tcp_req_info)
223464d318eaSCy Schubert 						return tcp_req_info_handle_read_close(c->tcp_req_info);
223564d318eaSCy Schubert 					return 0;
223664d318eaSCy Schubert 				} else if(r == -1) {
2237865f46b2SCy Schubert 					goto recv_error_initial;
2238865f46b2SCy Schubert 				}
2239865f46b2SCy Schubert 				c->tcp_byte_count += r;
2240103ba509SCy Schubert 				sldns_buffer_skip(c->buffer, r);
				/* partial read: keep the state and continue
				 * on a later call */
2241865f46b2SCy Schubert 				if(c->tcp_byte_count != current_read_size) return 1;
2242865f46b2SCy Schubert 				c->pp2_header_state = pp2_header_init;
2243865f46b2SCy Schubert 			}
2244865f46b2SCy Schubert 		}
2245865f46b2SCy Schubert 		if(c->pp2_header_state == pp2_header_init) {
2246103ba509SCy Schubert 			int err;
			/* the fixed part is in the buffer; it is checked
			 * again on every call made in this state */
2247103ba509SCy Schubert 			err = pp2_read_header(
2248103ba509SCy Schubert 				sldns_buffer_begin(c->buffer),
2249103ba509SCy Schubert 				sldns_buffer_limit(c->buffer));
2250103ba509SCy Schubert 			if(err) {
2251865f46b2SCy Schubert 				log_err("proxy_protocol: could not parse "
2252103ba509SCy Schubert 					"PROXYv2 header (%s)",
2253103ba509SCy Schubert 					pp_lookup_error(err));
2254865f46b2SCy Schubert 				return 0;
2255865f46b2SCy Schubert 			}
2256103ba509SCy Schubert 			header = (struct pp2_header*)sldns_buffer_begin(c->buffer);
			/* length of the variable part, from the header */
2257865f46b2SCy Schubert 			want_read_size = ntohs(header->len);
2258103ba509SCy Schubert 			if(sldns_buffer_limit(c->buffer) <
2259865f46b2SCy Schubert 				PP2_HEADER_SIZE + want_read_size) {
2260865f46b2SCy Schubert 				log_err_addr("proxy_protocol: not enough "
2261865f46b2SCy Schubert 					"buffer size to read PROXYv2 header", "",
2262865f46b2SCy Schubert 					&c->repinfo.remote_addr,
2263865f46b2SCy Schubert 					c->repinfo.remote_addrlen);
2264865f46b2SCy Schubert 				return 0;
2265865f46b2SCy Schubert 			}
2266865f46b2SCy Schubert 			verbose(VERB_ALGO, "proxy_protocol: reading variable "
2267865f46b2SCy Schubert 				"part of PROXYv2 header (len %lu)",
2268865f46b2SCy Schubert 				(unsigned long)want_read_size);
2269865f46b2SCy Schubert 			current_read_size = PP2_HEADER_SIZE + want_read_size;
2270865f46b2SCy Schubert 			if(want_read_size == 0) {
2271865f46b2SCy Schubert 				/* nothing more to read; header is complete */
2272865f46b2SCy Schubert 				c->pp2_header_state = pp2_header_done;
2273865f46b2SCy Schubert 			} else if(c->tcp_byte_count < current_read_size) {
2274865f46b2SCy Schubert 				r = recv(fd, (void*)sldns_buffer_at(c->buffer,
2275865f46b2SCy Schubert 					c->tcp_byte_count),
2276865f46b2SCy Schubert 					current_read_size-c->tcp_byte_count, MSG_DONTWAIT);
2277865f46b2SCy Schubert 				if(r == 0) {
2278865f46b2SCy Schubert 					if(c->tcp_req_info)
2279865f46b2SCy Schubert 						return tcp_req_info_handle_read_close(c->tcp_req_info);
2280865f46b2SCy Schubert 					return 0;
2281865f46b2SCy Schubert 				} else if(r == -1) {
2282865f46b2SCy Schubert 					goto recv_error;
2283865f46b2SCy Schubert 				}
2284865f46b2SCy Schubert 				c->tcp_byte_count += r;
2285103ba509SCy Schubert 				sldns_buffer_skip(c->buffer, r);
2286865f46b2SCy Schubert 				if(c->tcp_byte_count != current_read_size) return 1;
2287865f46b2SCy Schubert 				c->pp2_header_state = pp2_header_done;
2288865f46b2SCy Schubert 			}
2289865f46b2SCy Schubert 		}
		/* header is only assigned in the pp2_header_init stage
		 * above, so a NULL header means that stage did not run */
2290865f46b2SCy Schubert 		if(c->pp2_header_state != pp2_header_done || !header) {
2291865f46b2SCy Schubert 			log_err_addr("proxy_protocol: wrong state for the "
2292865f46b2SCy Schubert 				"PROXYv2 header", "", &c->repinfo.remote_addr,
2293865f46b2SCy Schubert 				c->repinfo.remote_addrlen);
2294865f46b2SCy Schubert 			return 0;
2295865f46b2SCy Schubert 		}
2296103ba509SCy Schubert 		sldns_buffer_flip(c->buffer);
2297865f46b2SCy Schubert 		if(!consume_pp2_header(c->buffer, &c->repinfo, 1)) {
2298865f46b2SCy Schubert 			log_err_addr("proxy_protocol: could not consume "
2299865f46b2SCy Schubert 				"PROXYv2 header", "", &c->repinfo.remote_addr,
2300865f46b2SCy Schubert 				c->repinfo.remote_addrlen);
2301865f46b2SCy Schubert 			return 0;
2302865f46b2SCy Schubert 		}
2303865f46b2SCy Schubert 		verbose(VERB_ALGO, "proxy_protocol: successful read of "
2304865f46b2SCy Schubert 			"PROXYv2 header");
2305865f46b2SCy Schubert 		/* Clear and reset the buffer to read the following
2306865f46b2SCy Schubert 		    * DNS packet(s). */
2307865f46b2SCy Schubert 		sldns_buffer_clear(c->buffer);
2308865f46b2SCy Schubert 		c->tcp_byte_count = 0;
2309865f46b2SCy Schubert 		return 1;
2310865f46b2SCy Schubert 	}
2311865f46b2SCy Schubert 
2312865f46b2SCy Schubert 	if(c->tcp_byte_count < sizeof(uint16_t)) {
2313865f46b2SCy Schubert 		/* read length bytes */
		/* they are stored at the start of the buffer; there is no
		 * sldns_buffer_skip here, so the buffer position is not
		 * moved by this step */
2314865f46b2SCy Schubert 		r = recv(fd,(void*)sldns_buffer_at(c->buffer,c->tcp_byte_count),
2315865f46b2SCy Schubert 			sizeof(uint16_t)-c->tcp_byte_count, MSG_DONTWAIT);
2316865f46b2SCy Schubert 		if(r == 0) {
2317865f46b2SCy Schubert 			if(c->tcp_req_info)
2318865f46b2SCy Schubert 				return tcp_req_info_handle_read_close(c->tcp_req_info);
2319865f46b2SCy Schubert 			return 0;
2320865f46b2SCy Schubert 		} else if(r == -1) {
			/* with pp2 enabled the PROXYv2 read came first, so
			 * this read does not get the initial treatment */
2321865f46b2SCy Schubert 			if(c->pp2_enabled) goto recv_error;
2322865f46b2SCy Schubert 			goto recv_error_initial;
2323865f46b2SCy Schubert 		}
2324865f46b2SCy Schubert 		c->tcp_byte_count += r;
2325865f46b2SCy Schubert 		if(c->tcp_byte_count != sizeof(uint16_t))
2326865f46b2SCy Schubert 			return 1;
		/* both length bytes are in; check the announced length
		 * against the buffer capacity */
2327865f46b2SCy Schubert 		if(sldns_buffer_read_u16_at(c->buffer, 0) >
2328865f46b2SCy Schubert 			sldns_buffer_capacity(c->buffer)) {
2329865f46b2SCy Schubert 			verbose(VERB_QUERY, "tcp: dropped larger than buffer");
2330865f46b2SCy Schubert 			return 0;
2331865f46b2SCy Schubert 		}
		/* limit the buffer to the announced message length */
2332865f46b2SCy Schubert 		sldns_buffer_set_limit(c->buffer,
2333865f46b2SCy Schubert 			sldns_buffer_read_u16_at(c->buffer, 0));
2334865f46b2SCy Schubert 		if(!short_ok &&
2335865f46b2SCy Schubert 			sldns_buffer_limit(c->buffer) < LDNS_HEADER_SIZE) {
2336865f46b2SCy Schubert 			verbose(VERB_QUERY, "tcp: dropped bogus too short.");
2337865f46b2SCy Schubert 			return 0;
2338865f46b2SCy Schubert 		}
2339865f46b2SCy Schubert 		verbose(VERB_ALGO, "Reading tcp query of length %d",
2340865f46b2SCy Schubert 			(int)sldns_buffer_limit(c->buffer));
2341865f46b2SCy Schubert 	}
2342865f46b2SCy Schubert 
	/* read (more of) the message into the buffer, up to its limit */
2343865f46b2SCy Schubert 	if(sldns_buffer_remaining(c->buffer) == 0)
2344865f46b2SCy Schubert 		log_err("in comm_point_tcp_handle_read buffer_remaining is "
2345865f46b2SCy Schubert 			"not > 0 as expected, continuing with (harmless) 0 "
2346865f46b2SCy Schubert 			"length recv");
2347865f46b2SCy Schubert 	r = recv(fd, (void*)sldns_buffer_current(c->buffer),
2348865f46b2SCy Schubert 		sldns_buffer_remaining(c->buffer), MSG_DONTWAIT);
2349865f46b2SCy Schubert 	if(r == 0) {
2350865f46b2SCy Schubert 		if(c->tcp_req_info)
2351865f46b2SCy Schubert 			return tcp_req_info_handle_read_close(c->tcp_req_info);
2352865f46b2SCy Schubert 		return 0;
2353865f46b2SCy Schubert 	} else if(r == -1) {
2354865f46b2SCy Schubert 		goto recv_error;
2355865f46b2SCy Schubert 	}
2356865f46b2SCy Schubert 	sldns_buffer_skip(c->buffer, r);
	/* the message is complete when the buffer is filled to its limit */
2357865f46b2SCy Schubert 	if(sldns_buffer_remaining(c->buffer) <= 0) {
2358865f46b2SCy Schubert 		tcp_callback_reader(c);
2359865f46b2SCy Schubert 	}
2360865f46b2SCy Schubert 	return 1;
2361865f46b2SCy Schubert 
	/* Error handling for a failed recv. Nothing may be called between
	 * the failed recv and this code, since errno (or WSAGetLastError)
	 * is examined here. recv_error_initial is used for a failure of
	 * the fixed PROXYv2 part read, or of the length read when pp2 is
	 * not enabled. */
2362865f46b2SCy Schubert recv_error_initial:
2363865f46b2SCy Schubert 	recv_initial = 1;
2364865f46b2SCy Schubert recv_error:
2365b7579f77SDag-Erling Smørgrav #ifndef USE_WINSOCK
	/* transient condition: report success; presumably the read is
	 * attempted again on a later event */
2366b7579f77SDag-Erling Smørgrav 	if(errno == EINTR || errno == EAGAIN)
2367b7579f77SDag-Erling Smørgrav 		return 1;
	/* for the initial read, connection level errors are only logged
	 * at verbosity 2 and higher */
2368865f46b2SCy Schubert 	if(recv_initial) {
2369b7579f77SDag-Erling Smørgrav #ifdef ECONNRESET
2370b7579f77SDag-Erling Smørgrav 		if(errno == ECONNRESET && verbosity < 2)
2371b7579f77SDag-Erling Smørgrav 			return 0; /* silence reset by peer */
2372b7579f77SDag-Erling Smørgrav #endif
23735469a995SCy Schubert #ifdef ECONNREFUSED
23745469a995SCy Schubert 		if(errno == ECONNREFUSED && verbosity < 2)
23755469a995SCy Schubert 			return 0; /* silence connection refused */
23765469a995SCy Schubert #endif
2377f44e67d1SCy Schubert #ifdef ENETUNREACH
2378f44e67d1SCy Schubert 		if(errno == ENETUNREACH && verbosity < 2)
2379f44e67d1SCy Schubert 			return 0; /* silence it */
2380f44e67d1SCy Schubert #endif
2381f44e67d1SCy Schubert #ifdef EHOSTDOWN
2382f44e67d1SCy Schubert 		if(errno == EHOSTDOWN && verbosity < 2)
2383f44e67d1SCy Schubert 			return 0; /* silence it */
2384f44e67d1SCy Schubert #endif
2385f44e67d1SCy Schubert #ifdef EHOSTUNREACH
2386f44e67d1SCy Schubert 		if(errno == EHOSTUNREACH && verbosity < 2)
2387f44e67d1SCy Schubert 			return 0; /* silence it */
2388f44e67d1SCy Schubert #endif
2389f44e67d1SCy Schubert #ifdef ENETDOWN
2390f44e67d1SCy Schubert 		if(errno == ENETDOWN && verbosity < 2)
2391f44e67d1SCy Schubert 			return 0; /* silence it */
2392f44e67d1SCy Schubert #endif
2393f44e67d1SCy Schubert #ifdef EACCES
2394f44e67d1SCy Schubert 		if(errno == EACCES && verbosity < 2)
2395f44e67d1SCy Schubert 			return 0; /* silence it */
2396f44e67d1SCy Schubert #endif
2397f44e67d1SCy Schubert #ifdef ENOTCONN
		/* not verbosity dependent: always logged, with a hint
		 * about TCP Fast Open */
2398f44e67d1SCy Schubert 		if(errno == ENOTCONN) {
2399865f46b2SCy Schubert 			log_err_addr("read (in tcp s) failed and this "
2400865f46b2SCy Schubert 				"could be because TCP Fast Open is "
2401865f46b2SCy Schubert 				"enabled [--disable-tfo-client "
2402865f46b2SCy Schubert 				"--disable-tfo-server] but does not "
2403865f46b2SCy Schubert 				"work", sock_strerror(errno),
2404865f46b2SCy Schubert 				&c->repinfo.remote_addr,
2405865f46b2SCy Schubert 				c->repinfo.remote_addrlen);
2406f44e67d1SCy Schubert 			return 0;
2407f44e67d1SCy Schubert 		}
2408f44e67d1SCy Schubert #endif
2409865f46b2SCy Schubert 	}
2410b7579f77SDag-Erling Smørgrav #else /* USE_WINSOCK */
2411865f46b2SCy Schubert 	if(recv_initial) {
24125469a995SCy Schubert 		if(WSAGetLastError() == WSAECONNREFUSED && verbosity < 2)
24135469a995SCy Schubert 			return 0;
24145469a995SCy Schubert 		if(WSAGetLastError() == WSAEHOSTDOWN && verbosity < 2)
24155469a995SCy Schubert 			return 0;
24165469a995SCy Schubert 		if(WSAGetLastError() == WSAEHOSTUNREACH && verbosity < 2)
24175469a995SCy Schubert 			return 0;
24185469a995SCy Schubert 		if(WSAGetLastError() == WSAENETDOWN && verbosity < 2)
24195469a995SCy Schubert 			return 0;
24205469a995SCy Schubert 		if(WSAGetLastError() == WSAENETUNREACH && verbosity < 2)
24215469a995SCy Schubert 			return 0;
2422865f46b2SCy Schubert 	}
	/* a connection reset is never logged here, at any verbosity */
2423b7579f77SDag-Erling Smørgrav 	if(WSAGetLastError() == WSAECONNRESET)
2424b7579f77SDag-Erling Smørgrav 		return 0;
2425b7579f77SDag-Erling Smørgrav 	if(WSAGetLastError() == WSAEINPROGRESS)
2426b7579f77SDag-Erling Smørgrav 		return 1;
2427b7579f77SDag-Erling Smørgrav 	if(WSAGetLastError() == WSAEWOULDBLOCK) {
2428e2d15004SDag-Erling Smørgrav 		ub_winsock_tcp_wouldblock(c->ev->ev,
2429e2d15004SDag-Erling Smørgrav 			UB_EV_READ);
2430b7579f77SDag-Erling Smørgrav 		return 1;
2431b7579f77SDag-Erling Smørgrav 	}
2432b7579f77SDag-Erling Smørgrav #endif
	/* every error that was not filtered above is logged */
2433c0caa2e2SCy Schubert 	log_err_addr("read (in tcp s)", sock_strerror(errno),
2434865f46b2SCy Schubert 		&c->repinfo.remote_addr, c->repinfo.remote_addrlen);
2435b7579f77SDag-Erling Smørgrav 	return 0;
2436b7579f77SDag-Erling Smørgrav }
2437b7579f77SDag-Erling Smørgrav 
2438b7579f77SDag-Erling Smørgrav /**
2439b7579f77SDag-Erling Smørgrav  * Handle tcp writing callback.
 * Sends the two byte length prefix followed by the message. In
 * tcp_write_and_read mode the data comes from tcp_write_pkt and progress
 * is kept in tcp_write_byte_count; otherwise the data comes from the
 * buffer and progress is kept in tcp_byte_count and the buffer position.
 * Both byte counts include the two prefix bytes. tcp_callback_writer() is
 * called when everything has been sent. TLS comm points are delegated to
 * ssl_handle_it() after the nonblocking connect check.
2440b7579f77SDag-Erling Smørgrav  * @param fd: file descriptor of socket.
2441b7579f77SDag-Erling Smørgrav  * @param c: comm point to write buffer out of.
2442b7579f77SDag-Erling Smørgrav  * @return: 0 on error
 *	1 is returned on progress and also for the retry cases (connect
 *	still in progress, partial write, EINTR, EAGAIN, would-block).
2443b7579f77SDag-Erling Smørgrav  */
2444b7579f77SDag-Erling Smørgrav static int
2445b7579f77SDag-Erling Smørgrav comm_point_tcp_handle_write(int fd, struct comm_point* c)
2446b7579f77SDag-Erling Smørgrav {
2447b7579f77SDag-Erling Smørgrav 	ssize_t r;
2448​65b390aaSDag-Erling Smørgrav 	struct sldns_buffer *buffer;
2449b7579f77SDag-Erling Smørgrav 	log_assert(c->type == comm_tcp);
	/* when compiled with dnscrypt, the data to send is taken from
	 * dnscrypt_buffer instead of buffer */
245065b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
245165b390aaSDag-Erling Smørgrav 	buffer = c->dnscrypt_buffer;
245265b390aaSDag-Erling Smørgrav #else
245365b390aaSDag-Erling Smørgrav 	buffer = c->buffer;
245465b390aaSDag-Erling Smørgrav #endif
	/* a write event for a plain tcp comm point that is reading and is
	 * not in write-and-read mode is reported as an error */
2455369c6923SCy Schubert 	if(c->tcp_is_reading && !c->ssl && !c->tcp_write_and_read)
2456b7579f77SDag-Erling Smørgrav 		return 0;
2457b7579f77SDag-Erling Smørgrav 	log_assert(fd != -1);
	/* only when nothing has been sent yet and the check is requested */
2458369c6923SCy Schubert 	if(((!c->tcp_write_and_read && c->tcp_byte_count == 0) || (c->tcp_write_and_read && c->tcp_write_byte_count == 0)) && c->tcp_check_nb_connect) {
2459b7579f77SDag-Erling Smørgrav 		/* check for pending error from nonblocking connect */
2460b7579f77SDag-Erling Smørgrav 		/* from Stevens, unix network programming, vol1, 3rd ed, p450*/
2461b7579f77SDag-Erling Smørgrav 		int error = 0;
2462b7579f77SDag-Erling Smørgrav 		socklen_t len = (socklen_t)sizeof(error);
2463b7579f77SDag-Erling Smørgrav 		if(getsockopt(fd, SOL_SOCKET, SO_ERROR, (void*)&error,
2464b7579f77SDag-Erling Smørgrav 			&len) < 0){
2465b7579f77SDag-Erling Smørgrav #ifndef USE_WINSOCK
2466b7579f77SDag-Erling Smørgrav 			error = errno; /* on solaris errno is error */
2467b7579f77SDag-Erling Smørgrav #else /* USE_WINSOCK */
2468b7579f77SDag-Erling Smørgrav 			error = WSAGetLastError();
2469b7579f77SDag-Erling Smørgrav #endif
2470b7579f77SDag-Erling Smørgrav 		}
		/* note: each platform branch below ends by opening an
		 * else-if block for the logged error case; that block is
		 * closed by the shared return 0 and brace after the
		 * #endif */
2471b7579f77SDag-Erling Smørgrav #ifndef USE_WINSOCK
2472b7579f77SDag-Erling Smørgrav #if defined(EINPROGRESS) && defined(EWOULDBLOCK)
2473b7579f77SDag-Erling Smørgrav 		if(error == EINPROGRESS || error == EWOULDBLOCK)
2474b7579f77SDag-Erling Smørgrav 			return 1; /* try again later */
2475b7579f77SDag-Erling Smørgrav 		else
2476b7579f77SDag-Erling Smørgrav #endif
2477b7579f77SDag-Erling Smørgrav 		if(error != 0 && verbosity < 2)
2478b7579f77SDag-Erling Smørgrav 			return 0; /* silence lots of chatter in the logs */
2479b7579f77SDag-Erling Smørgrav                 else if(error != 0) {
2480ff825849SDag-Erling Smørgrav 			log_err_addr("tcp connect", strerror(error),
2481865f46b2SCy Schubert 				&c->repinfo.remote_addr,
2482865f46b2SCy Schubert 				c->repinfo.remote_addrlen);
2483b7579f77SDag-Erling Smørgrav #else /* USE_WINSOCK */
2484b7579f77SDag-Erling Smørgrav 		/* examine error */
2485b7579f77SDag-Erling Smørgrav 		if(error == WSAEINPROGRESS)
2486b7579f77SDag-Erling Smørgrav 			return 1;
2487b7579f77SDag-Erling Smørgrav 		else if(error == WSAEWOULDBLOCK) {
2488e2d15004SDag-Erling Smørgrav 			ub_winsock_tcp_wouldblock(c->ev->ev, UB_EV_WRITE);
2489b7579f77SDag-Erling Smørgrav 			return 1;
2490b7579f77SDag-Erling Smørgrav 		} else if(error != 0 && verbosity < 2)
2491b7579f77SDag-Erling Smørgrav 			return 0;
2492b7579f77SDag-Erling Smørgrav 		else if(error != 0) {
2493ff825849SDag-Erling Smørgrav 			log_err_addr("tcp connect", wsa_strerror(error),
2494865f46b2SCy Schubert 				&c->repinfo.remote_addr,
2495865f46b2SCy Schubert 				c->repinfo.remote_addrlen);
2496b7579f77SDag-Erling Smørgrav #endif /* USE_WINSOCK */
2497b7579f77SDag-Erling Smørgrav 			return 0;
2498b7579f77SDag-Erling Smørgrav 		}
2499b7579f77SDag-Erling Smørgrav 	}
	/* TLS connections are written by the ssl handler */
2500b7579f77SDag-Erling Smørgrav 	if(c->ssl)
2501369c6923SCy Schubert 		return ssl_handle_it(c, 1);
2502b7579f77SDag-Erling Smørgrav 
2503b5663de9SDag-Erling Smørgrav #ifdef USE_MSG_FASTOPEN
2504b5663de9SDag-Erling Smørgrav 	/* Only try this on first use of a connection that uses tfo,
2505b5663de9SDag-Erling Smørgrav 	   otherwise fall through to normal write */
2506b5663de9SDag-Erling Smørgrav 	/* Also, TFO support on WINDOWS not implemented at the moment */
2507b5663de9SDag-Erling Smørgrav 	if(c->tcp_do_fastopen == 1) {
2508b5663de9SDag-Erling Smørgrav 		/* this form of sendmsg() does both a connect() and send() so need to
2509b5663de9SDag-Erling Smørgrav 		   look for various flavours of error*/
2510369c6923SCy Schubert 		uint16_t len = htons(c->tcp_write_and_read?c->tcp_write_pkt_len:sldns_buffer_limit(buffer));
2511b5663de9SDag-Erling Smørgrav 		struct msghdr msg;
2512b5663de9SDag-Erling Smørgrav 		struct iovec iov[2];
		/* clear the flag so that fastopen is attempted only once */
2513b5663de9SDag-Erling Smørgrav 		c->tcp_do_fastopen = 0;
2514b5663de9SDag-Erling Smørgrav 		memset(&msg, 0, sizeof(msg));
		/* iov[0] is the unsent part of the length prefix, iov[1]
		 * is the whole message */
2515369c6923SCy Schubert 		if(c->tcp_write_and_read) {
2516369c6923SCy Schubert 			iov[0].iov_base = (uint8_t*)&len + c->tcp_write_byte_count;
2517369c6923SCy Schubert 			iov[0].iov_len = sizeof(uint16_t) - c->tcp_write_byte_count;
2518369c6923SCy Schubert 			iov[1].iov_base = c->tcp_write_pkt;
2519369c6923SCy Schubert 			iov[1].iov_len = c->tcp_write_pkt_len;
2520369c6923SCy Schubert 		} else {
2521b5663de9SDag-Erling Smørgrav 			iov[0].iov_base = (uint8_t*)&len + c->tcp_byte_count;
2522b5663de9SDag-Erling Smørgrav 			iov[0].iov_len = sizeof(uint16_t) - c->tcp_byte_count;
252365b390aaSDag-Erling Smørgrav 			iov[1].iov_base = sldns_buffer_begin(buffer);
252465b390aaSDag-Erling Smørgrav 			iov[1].iov_len = sldns_buffer_limit(buffer);
2525369c6923SCy Schubert 		}
2526b5663de9SDag-Erling Smørgrav 		log_assert(iov[0].iov_len > 0);
		/* the destination address is passed along, because this
		 * sendmsg also performs the connect */
2527865f46b2SCy Schubert 		msg.msg_name = &c->repinfo.remote_addr;
2528865f46b2SCy Schubert 		msg.msg_namelen = c->repinfo.remote_addrlen;
2529b5663de9SDag-Erling Smørgrav 		msg.msg_iov = iov;
2530b5663de9SDag-Erling Smørgrav 		msg.msg_iovlen = 2;
2531b5663de9SDag-Erling Smørgrav 		r = sendmsg(fd, &msg, MSG_FASTOPEN);
2532b5663de9SDag-Erling Smørgrav 		if (r == -1) {
2533b5663de9SDag-Erling Smørgrav #if defined(EINPROGRESS) && defined(EWOULDBLOCK)
2534b5663de9SDag-Erling Smørgrav 			/* Handshake is underway, maybe because no TFO cookie available.
25358a384985SDag-Erling Smørgrav 			   Come back to write the message*/
2536b5663de9SDag-Erling Smørgrav 			if(errno == EINPROGRESS || errno == EWOULDBLOCK)
2537b5663de9SDag-Erling Smørgrav 				return 1;
2538b5663de9SDag-Erling Smørgrav #endif
2539b5663de9SDag-Erling Smørgrav 			if(errno == EINTR || errno == EAGAIN)
2540b5663de9SDag-Erling Smørgrav 				return 1;
2541b5663de9SDag-Erling Smørgrav 			/* Not handling EISCONN here as shouldn't ever hit that case.*/
			/* EPIPE, EOPNOTSUPP (if defined) and a zero errno
			 * continue to the normal connect below; any other
			 * error fails the write */
254224e36522SCy Schubert 			if(errno != EPIPE
254324e36522SCy Schubert #ifdef EOPNOTSUPP
254424e36522SCy Schubert 				/* if /proc/sys/net/ipv4/tcp_fastopen is
254524e36522SCy Schubert 				 * disabled on Linux, sendmsg may return
254624e36522SCy Schubert 				 * 'Operation not supported', if so
254724e36522SCy Schubert 				 * fallthrough to ordinary connect. */
254824e36522SCy Schubert 				&& errno != EOPNOTSUPP
254924e36522SCy Schubert #endif
255024e36522SCy Schubert 				&& errno != 0) {
255124e36522SCy Schubert 				if(verbosity < 2)
2552b5663de9SDag-Erling Smørgrav 					return 0; /* silence lots of chatter in the logs */
2553b5663de9SDag-Erling Smørgrav 				log_err_addr("tcp sendmsg", strerror(errno),
2554865f46b2SCy Schubert 					&c->repinfo.remote_addr,
2555865f46b2SCy Schubert 					c->repinfo.remote_addrlen);
2556b5663de9SDag-Erling Smørgrav 				return 0;
2557c7f4d7adSDag-Erling Smørgrav 			}
255824e36522SCy Schubert 			verbose(VERB_ALGO, "tcp sendmsg for fastopen failed (with %s), try normal connect", strerror(errno));
2559c7f4d7adSDag-Erling Smørgrav 			/* fallthrough to nonFASTOPEN
2560c7f4d7adSDag-Erling Smørgrav 			 * (MSG_FASTOPEN on Linux 3 produces EPIPE)
2561c7f4d7adSDag-Erling Smørgrav 			 * we need to perform connect() */
2562865f46b2SCy Schubert 			if(connect(fd, (struct sockaddr *)&c->repinfo.remote_addr,
2563865f46b2SCy Schubert 				c->repinfo.remote_addrlen) == -1) {
2564c7f4d7adSDag-Erling Smørgrav #ifdef EINPROGRESS
2565c7f4d7adSDag-Erling Smørgrav 				if(errno == EINPROGRESS)
2566c7f4d7adSDag-Erling Smørgrav 					return 1; /* wait until connect done*/
2567c7f4d7adSDag-Erling Smørgrav #endif
2568c7f4d7adSDag-Erling Smørgrav #ifdef USE_WINSOCK
2569c7f4d7adSDag-Erling Smørgrav 				if(WSAGetLastError() == WSAEINPROGRESS ||
2570c7f4d7adSDag-Erling Smørgrav 					WSAGetLastError() == WSAEWOULDBLOCK)
2571c7f4d7adSDag-Erling Smørgrav 					return 1; /* wait until connect done*/
2572c7f4d7adSDag-Erling Smørgrav #endif
2573c7f4d7adSDag-Erling Smørgrav 				if(tcp_connect_errno_needs_log(
2574865f46b2SCy Schubert 					(struct sockaddr *)&c->repinfo.remote_addr,
2575865f46b2SCy Schubert 					c->repinfo.remote_addrlen)) {
2576c7f4d7adSDag-Erling Smørgrav 					log_err_addr("outgoing tcp: connect after EPIPE for fastopen",
2577865f46b2SCy Schubert 						strerror(errno),
2578865f46b2SCy Schubert 						&c->repinfo.remote_addr,
2579865f46b2SCy Schubert 						c->repinfo.remote_addrlen);
2580c7f4d7adSDag-Erling Smørgrav 				}
2581c7f4d7adSDag-Erling Smørgrav 				return 0;
2582c7f4d7adSDag-Erling Smørgrav 			}
			/* connect succeeded at once: continue with the
			 * normal write below */
2583c7f4d7adSDag-Erling Smørgrav 
2584b5663de9SDag-Erling Smørgrav 		} else {
			/* r counts the length prefix bytes as well; the
			 * buffer position is the count without those two */
2585369c6923SCy Schubert 			if(c->tcp_write_and_read) {
2586369c6923SCy Schubert 				c->tcp_write_byte_count += r;
2587369c6923SCy Schubert 				if(c->tcp_write_byte_count < sizeof(uint16_t))
2588369c6923SCy Schubert 					return 1;
2589369c6923SCy Schubert 			} else {
2590b5663de9SDag-Erling Smørgrav 				c->tcp_byte_count += r;
2591b5663de9SDag-Erling Smørgrav 				if(c->tcp_byte_count < sizeof(uint16_t))
2592b5663de9SDag-Erling Smørgrav 					return 1;
259365b390aaSDag-Erling Smørgrav 				sldns_buffer_set_position(buffer, c->tcp_byte_count -
2594b5663de9SDag-Erling Smørgrav 					sizeof(uint16_t));
2595369c6923SCy Schubert 			}
			/* done when the prefix and the whole message have
			 * been sent (hence the + 2) */
2596369c6923SCy Schubert 			if((!c->tcp_write_and_read && sldns_buffer_remaining(buffer) == 0) || (c->tcp_write_and_read && c->tcp_write_byte_count == c->tcp_write_pkt_len + 2)) {
2597b5663de9SDag-Erling Smørgrav 				tcp_callback_writer(c);
2598b5663de9SDag-Erling Smørgrav 				return 1;
2599b5663de9SDag-Erling Smørgrav 			}
2600b5663de9SDag-Erling Smørgrav 		}
2601b5663de9SDag-Erling Smørgrav 	}
2602b5663de9SDag-Erling Smørgrav #endif /* USE_MSG_FASTOPEN */
2603b5663de9SDag-Erling Smørgrav 
	/* the length prefix has not been fully sent yet */
2604369c6923SCy Schubert 	if((c->tcp_write_and_read?c->tcp_write_byte_count:c->tcp_byte_count) < sizeof(uint16_t)) {
2605369c6923SCy Schubert 		uint16_t len = htons(c->tcp_write_and_read?c->tcp_write_pkt_len:sldns_buffer_limit(buffer));
2606b7579f77SDag-Erling Smørgrav #ifdef HAVE_WRITEV
		/* with writev the rest of the prefix and the message are
		 * offered to the socket in one call */
2607b7579f77SDag-Erling Smørgrav 		struct iovec iov[2];
2608369c6923SCy Schubert 		if(c->tcp_write_and_read) {
2609369c6923SCy Schubert 			iov[0].iov_base = (uint8_t*)&len + c->tcp_write_byte_count;
2610369c6923SCy Schubert 			iov[0].iov_len = sizeof(uint16_t) - c->tcp_write_byte_count;
2611369c6923SCy Schubert 			iov[1].iov_base = c->tcp_write_pkt;
2612369c6923SCy Schubert 			iov[1].iov_len = c->tcp_write_pkt_len;
2613369c6923SCy Schubert 		} else {
2614b7579f77SDag-Erling Smørgrav 			iov[0].iov_base = (uint8_t*)&len + c->tcp_byte_count;
2615b7579f77SDag-Erling Smørgrav 			iov[0].iov_len = sizeof(uint16_t) - c->tcp_byte_count;
261665b390aaSDag-Erling Smørgrav 			iov[1].iov_base = sldns_buffer_begin(buffer);
261765b390aaSDag-Erling Smørgrav 			iov[1].iov_len = sldns_buffer_limit(buffer);
2618369c6923SCy Schubert 		}
2619b7579f77SDag-Erling Smørgrav 		log_assert(iov[0].iov_len > 0);
2620b7579f77SDag-Erling Smørgrav 		r = writev(fd, iov, 2);
2621b7579f77SDag-Erling Smørgrav #else /* HAVE_WRITEV */
		/* without writev only the rest of the length prefix is
		 * sent in this step */
2622369c6923SCy Schubert 		if(c->tcp_write_and_read) {
2623369c6923SCy Schubert 			r = send(fd, (void*)(((uint8_t*)&len)+c->tcp_write_byte_count),
2624369c6923SCy Schubert 				sizeof(uint16_t)-c->tcp_write_byte_count, 0);
2625369c6923SCy Schubert 		} else {
2626b7579f77SDag-Erling Smørgrav 			r = send(fd, (void*)(((uint8_t*)&len)+c->tcp_byte_count),
2627b7579f77SDag-Erling Smørgrav 				sizeof(uint16_t)-c->tcp_byte_count, 0);
2628369c6923SCy Schubert 		}
2629b7579f77SDag-Erling Smørgrav #endif /* HAVE_WRITEV */
2630b7579f77SDag-Erling Smørgrav 		if(r == -1) {
2631b7579f77SDag-Erling Smørgrav #ifndef USE_WINSOCK
2632b7579f77SDag-Erling Smørgrav #  ifdef EPIPE
2633b7579f77SDag-Erling Smørgrav                 	if(errno == EPIPE && verbosity < 2)
2634b7579f77SDag-Erling Smørgrav                         	return 0; /* silence 'broken pipe' */
2635b7579f77SDag-Erling Smørgrav   #endif
2636b7579f77SDag-Erling Smørgrav 			if(errno == EINTR || errno == EAGAIN)
2637b7579f77SDag-Erling Smørgrav 				return 1;
2638e86b9096SDag-Erling Smørgrav #ifdef ECONNRESET
2639e86b9096SDag-Erling Smørgrav 			if(errno == ECONNRESET && verbosity < 2)
2640e86b9096SDag-Erling Smørgrav 				return 0; /* silence reset by peer */
2641e86b9096SDag-Erling Smørgrav #endif
2642ff825849SDag-Erling Smørgrav #  ifdef HAVE_WRITEV
2643ff825849SDag-Erling Smørgrav 			log_err_addr("tcp writev", strerror(errno),
2644865f46b2SCy Schubert 				&c->repinfo.remote_addr,
2645865f46b2SCy Schubert 				c->repinfo.remote_addrlen);
2646ff825849SDag-Erling Smørgrav #  else /* HAVE_WRITEV */
2647ff825849SDag-Erling Smørgrav 			log_err_addr("tcp send s", strerror(errno),
2648865f46b2SCy Schubert 				&c->repinfo.remote_addr,
2649865f46b2SCy Schubert 				c->repinfo.remote_addrlen);
2650ff825849SDag-Erling Smørgrav #  endif /* HAVE_WRITEV */
2651b7579f77SDag-Erling Smørgrav #else
			/* not connected yet is a retry case here */
2652b7579f77SDag-Erling Smørgrav 			if(WSAGetLastError() == WSAENOTCONN)
2653b7579f77SDag-Erling Smørgrav 				return 1;
2654b7579f77SDag-Erling Smørgrav 			if(WSAGetLastError() == WSAEINPROGRESS)
2655b7579f77SDag-Erling Smørgrav 				return 1;
2656b7579f77SDag-Erling Smørgrav 			if(WSAGetLastError() == WSAEWOULDBLOCK) {
2657e2d15004SDag-Erling Smørgrav 				ub_winsock_tcp_wouldblock(c->ev->ev,
2658e2d15004SDag-Erling Smørgrav 					UB_EV_WRITE);
2659b7579f77SDag-Erling Smørgrav 				return 1;
2660b7579f77SDag-Erling Smørgrav 			}
2661e86b9096SDag-Erling Smørgrav 			if(WSAGetLastError() == WSAECONNRESET && verbosity < 2)
2662e86b9096SDag-Erling Smørgrav 				return 0; /* silence reset by peer */
2663ff825849SDag-Erling Smørgrav 			log_err_addr("tcp send s",
2664ff825849SDag-Erling Smørgrav 				wsa_strerror(WSAGetLastError()),
2665865f46b2SCy Schubert 				&c->repinfo.remote_addr,
2666865f46b2SCy Schubert 				c->repinfo.remote_addrlen);
2667b7579f77SDag-Erling Smørgrav #endif
2668b7579f77SDag-Erling Smørgrav 			return 0;
2669b7579f77SDag-Erling Smørgrav 		}
		/* account for what was sent; return if the length prefix
		 * is still incomplete */
2670369c6923SCy Schubert 		if(c->tcp_write_and_read) {
2671369c6923SCy Schubert 			c->tcp_write_byte_count += r;
2672369c6923SCy Schubert 			if(c->tcp_write_byte_count < sizeof(uint16_t))
2673369c6923SCy Schubert 				return 1;
2674369c6923SCy Schubert 		} else {
2675b7579f77SDag-Erling Smørgrav 			c->tcp_byte_count += r;
2676b7579f77SDag-Erling Smørgrav 			if(c->tcp_byte_count < sizeof(uint16_t))
2677b7579f77SDag-Erling Smørgrav 				return 1;
267865b390aaSDag-Erling Smørgrav 			sldns_buffer_set_position(buffer, c->tcp_byte_count -
2679b7579f77SDag-Erling Smørgrav 				sizeof(uint16_t));
2680369c6923SCy Schubert 		}
2681369c6923SCy Schubert 		if((!c->tcp_write_and_read && sldns_buffer_remaining(buffer) == 0) || (c->tcp_write_and_read && c->tcp_write_byte_count == c->tcp_write_pkt_len + 2)) {
2682b7579f77SDag-Erling Smørgrav 			tcp_callback_writer(c);
2683b7579f77SDag-Erling Smørgrav 			return 1;
2684b7579f77SDag-Erling Smørgrav 		}
2685b7579f77SDag-Erling Smørgrav 	}
	/* the length prefix is out and part of the message is left */
2686369c6923SCy Schubert 	log_assert(c->tcp_write_and_read || sldns_buffer_remaining(buffer) > 0);
2687369c6923SCy Schubert 	log_assert(!c->tcp_write_and_read || c->tcp_write_byte_count < c->tcp_write_pkt_len + 2);
	/* send the rest of the message; tcp_write_byte_count includes the
	 * two prefix bytes, hence the - 2 for the offset into the packet */
2688369c6923SCy Schubert 	if(c->tcp_write_and_read) {
2689f44e67d1SCy Schubert 		r = send(fd, (void*)(c->tcp_write_pkt + c->tcp_write_byte_count - 2),
2690369c6923SCy Schubert 			c->tcp_write_pkt_len + 2 - c->tcp_write_byte_count, 0);
2691369c6923SCy Schubert 	} else {
269265b390aaSDag-Erling Smørgrav 		r = send(fd, (void*)sldns_buffer_current(buffer),
269365b390aaSDag-Erling Smørgrav 			sldns_buffer_remaining(buffer), 0);
2694369c6923SCy Schubert 	}
2695b7579f77SDag-Erling Smørgrav 	if(r == -1) {
2696b7579f77SDag-Erling Smørgrav #ifndef USE_WINSOCK
2697b7579f77SDag-Erling Smørgrav 		if(errno == EINTR || errno == EAGAIN)
2698b7579f77SDag-Erling Smørgrav 			return 1;
2699e86b9096SDag-Erling Smørgrav #ifdef ECONNRESET
2700e86b9096SDag-Erling Smørgrav 		if(errno == ECONNRESET && verbosity < 2)
2701e86b9096SDag-Erling Smørgrav 			return 0; /* silence reset by peer */
2702e86b9096SDag-Erling Smørgrav #endif
2703b7579f77SDag-Erling Smørgrav #else
2704b7579f77SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAEINPROGRESS)
2705b7579f77SDag-Erling Smørgrav 			return 1;
2706b7579f77SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAEWOULDBLOCK) {
2707e2d15004SDag-Erling Smørgrav 			ub_winsock_tcp_wouldblock(c->ev->ev, UB_EV_WRITE);
2708b7579f77SDag-Erling Smørgrav 			return 1;
2709b7579f77SDag-Erling Smørgrav 		}
2710e86b9096SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAECONNRESET && verbosity < 2)
2711e86b9096SDag-Erling Smørgrav 			return 0; /* silence reset by peer */
2712b7579f77SDag-Erling Smørgrav #endif
2713c0caa2e2SCy Schubert 		log_err_addr("tcp send r", sock_strerror(errno),
2714865f46b2SCy Schubert 			&c->repinfo.remote_addr,
2715865f46b2SCy Schubert 			c->repinfo.remote_addrlen);
2716b7579f77SDag-Erling Smørgrav 		return 0;
2717b7579f77SDag-Erling Smørgrav 	}
2718369c6923SCy Schubert 	if(c->tcp_write_and_read) {
2719369c6923SCy Schubert 		c->tcp_write_byte_count += r;
2720369c6923SCy Schubert 	} else {
272165b390aaSDag-Erling Smørgrav 		sldns_buffer_skip(buffer, r);
2722369c6923SCy Schubert 	}
2723b7579f77SDag-Erling Smørgrav 
	/* if this was a partial write, 1 is returned without the callback
	 * and the rest is sent on a later call */
2724369c6923SCy Schubert 	if((!c->tcp_write_and_read && sldns_buffer_remaining(buffer) == 0) || (c->tcp_write_and_read && c->tcp_write_byte_count == c->tcp_write_pkt_len + 2)) {
2725b7579f77SDag-Erling Smørgrav 		tcp_callback_writer(c);
2726b7579f77SDag-Erling Smørgrav 	}
2727b7579f77SDag-Erling Smørgrav 
2728b7579f77SDag-Erling Smørgrav 	return 1;
2729b7579f77SDag-Erling Smørgrav }
2730b7579f77SDag-Erling Smørgrav 
27311838dec3SCy Schubert /** read again to drain buffers when there could be more to read, returns 0
27321838dec3SCy Schubert  * on failure which means the comm point is closed. */
27331838dec3SCy Schubert static int
2734e86b9096SDag-Erling Smørgrav tcp_req_info_read_again(int fd, struct comm_point* c)
2735e86b9096SDag-Erling Smørgrav {
2736e86b9096SDag-Erling Smørgrav 	while(c->tcp_req_info->read_again) {
2737e86b9096SDag-Erling Smørgrav 		int r;
2738e86b9096SDag-Erling Smørgrav 		c->tcp_req_info->read_again = 0;
2739e86b9096SDag-Erling Smørgrav 		if(c->tcp_is_reading)
2740e86b9096SDag-Erling Smørgrav 			r = comm_point_tcp_handle_read(fd, c, 0);
2741e86b9096SDag-Erling Smørgrav 		else 	r = comm_point_tcp_handle_write(fd, c);
2742e86b9096SDag-Erling Smørgrav 		if(!r) {
2743e86b9096SDag-Erling Smørgrav 			reclaim_tcp_handler(c);
2744e86b9096SDag-Erling Smørgrav 			if(!c->tcp_do_close) {
2745e86b9096SDag-Erling Smørgrav 				fptr_ok(fptr_whitelist_comm_point(
2746e86b9096SDag-Erling Smørgrav 					c->callback));
2747e86b9096SDag-Erling Smørgrav 				(void)(*c->callback)(c, c->cb_arg,
2748e86b9096SDag-Erling Smørgrav 					NETEVENT_CLOSED, NULL);
2749e86b9096SDag-Erling Smørgrav 			}
27501838dec3SCy Schubert 			return 0;
2751e86b9096SDag-Erling Smørgrav 		}
2752e86b9096SDag-Erling Smørgrav 	}
27531838dec3SCy Schubert 	return 1;
2754e86b9096SDag-Erling Smørgrav }
2755e86b9096SDag-Erling Smørgrav 
2756369c6923SCy Schubert /** read again to drain buffers when there could be more to read */
2757369c6923SCy Schubert static void
2758369c6923SCy Schubert tcp_more_read_again(int fd, struct comm_point* c)
2759369c6923SCy Schubert {
2760369c6923SCy Schubert 	/* if the packet is done, but another one could be waiting on
2761369c6923SCy Schubert 	 * the connection, the callback signals this, and we try again */
2762369c6923SCy Schubert 	/* this continues until the read routines get EAGAIN or so,
2763369c6923SCy Schubert 	 * and thus does not call the callback, and the bool is 0 */
2764369c6923SCy Schubert 	int* moreread = c->tcp_more_read_again;
2765369c6923SCy Schubert 	while(moreread && *moreread) {
2766369c6923SCy Schubert 		*moreread = 0;
2767369c6923SCy Schubert 		if(!comm_point_tcp_handle_read(fd, c, 0)) {
2768369c6923SCy Schubert 			reclaim_tcp_handler(c);
2769369c6923SCy Schubert 			if(!c->tcp_do_close) {
2770369c6923SCy Schubert 				fptr_ok(fptr_whitelist_comm_point(
2771369c6923SCy Schubert 					c->callback));
2772369c6923SCy Schubert 				(void)(*c->callback)(c, c->cb_arg,
2773369c6923SCy Schubert 					NETEVENT_CLOSED, NULL);
2774369c6923SCy Schubert 			}
2775369c6923SCy Schubert 			return;
2776369c6923SCy Schubert 		}
2777369c6923SCy Schubert 	}
2778369c6923SCy Schubert }
2779369c6923SCy Schubert 
2780369c6923SCy Schubert /** write again to fill up when there could be more to write */
2781369c6923SCy Schubert static void
2782369c6923SCy Schubert tcp_more_write_again(int fd, struct comm_point* c)
2783369c6923SCy Schubert {
2784369c6923SCy Schubert 	/* if the packet is done, but another is waiting to be written,
2785369c6923SCy Schubert 	 * the callback signals it and we try again. */
2786369c6923SCy Schubert 	/* this continues until the write routines get EAGAIN or so,
2787369c6923SCy Schubert 	 * and thus does not call the callback, and the bool is 0 */
2788369c6923SCy Schubert 	int* morewrite = c->tcp_more_write_again;
2789369c6923SCy Schubert 	while(morewrite && *morewrite) {
2790369c6923SCy Schubert 		*morewrite = 0;
2791369c6923SCy Schubert 		if(!comm_point_tcp_handle_write(fd, c)) {
2792369c6923SCy Schubert 			reclaim_tcp_handler(c);
2793369c6923SCy Schubert 			if(!c->tcp_do_close) {
2794369c6923SCy Schubert 				fptr_ok(fptr_whitelist_comm_point(
2795369c6923SCy Schubert 					c->callback));
2796369c6923SCy Schubert 				(void)(*c->callback)(c, c->cb_arg,
2797369c6923SCy Schubert 					NETEVENT_CLOSED, NULL);
2798369c6923SCy Schubert 			}
2799369c6923SCy Schubert 			return;
2800369c6923SCy Schubert 		}
2801369c6923SCy Schubert 	}
2802369c6923SCy Schubert }
2803369c6923SCy Schubert 
2804b7579f77SDag-Erling Smørgrav void
2805b7579f77SDag-Erling Smørgrav comm_point_tcp_handle_callback(int fd, short event, void* arg)
2806b7579f77SDag-Erling Smørgrav {
2807b7579f77SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)arg;
2808b7579f77SDag-Erling Smørgrav 	log_assert(c->type == comm_tcp);
2809e2d15004SDag-Erling Smørgrav 	ub_comm_base_now(c->ev->base);
2810b7579f77SDag-Erling Smørgrav 
28111838dec3SCy Schubert 	if(c->fd == -1 || c->fd != fd)
28121838dec3SCy Schubert 		return; /* duplicate event, but commpoint closed. */
28131838dec3SCy Schubert 
281465b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
281565b390aaSDag-Erling Smørgrav 	/* Initialize if this is a dnscrypt socket */
281665b390aaSDag-Erling Smørgrav 	if(c->tcp_parent) {
281765b390aaSDag-Erling Smørgrav 		c->dnscrypt = c->tcp_parent->dnscrypt;
281865b390aaSDag-Erling Smørgrav 	}
281965b390aaSDag-Erling Smørgrav 	if(c->dnscrypt && c->dnscrypt_buffer == c->buffer) {
282065b390aaSDag-Erling Smørgrav 		c->dnscrypt_buffer = sldns_buffer_new(sldns_buffer_capacity(c->buffer));
282165b390aaSDag-Erling Smørgrav 		if(!c->dnscrypt_buffer) {
282265b390aaSDag-Erling Smørgrav 			log_err("Could not allocate dnscrypt buffer");
2823971980c3SDag-Erling Smørgrav 			reclaim_tcp_handler(c);
2824971980c3SDag-Erling Smørgrav 			if(!c->tcp_do_close) {
2825971980c3SDag-Erling Smørgrav 				fptr_ok(fptr_whitelist_comm_point(
2826971980c3SDag-Erling Smørgrav 					c->callback));
2827971980c3SDag-Erling Smørgrav 				(void)(*c->callback)(c, c->cb_arg,
2828971980c3SDag-Erling Smørgrav 					NETEVENT_CLOSED, NULL);
2829971980c3SDag-Erling Smørgrav 			}
283065b390aaSDag-Erling Smørgrav 			return;
283165b390aaSDag-Erling Smørgrav 		}
283265b390aaSDag-Erling Smørgrav 	}
283365b390aaSDag-Erling Smørgrav #endif
283465b390aaSDag-Erling Smørgrav 
2835e86b9096SDag-Erling Smørgrav 	if(event&UB_EV_TIMEOUT) {
2836e86b9096SDag-Erling Smørgrav 		verbose(VERB_QUERY, "tcp took too long, dropped");
2837e86b9096SDag-Erling Smørgrav 		reclaim_tcp_handler(c);
2838e86b9096SDag-Erling Smørgrav 		if(!c->tcp_do_close) {
2839e86b9096SDag-Erling Smørgrav 			fptr_ok(fptr_whitelist_comm_point(c->callback));
2840e86b9096SDag-Erling Smørgrav 			(void)(*c->callback)(c, c->cb_arg,
2841e86b9096SDag-Erling Smørgrav 				NETEVENT_TIMEOUT, NULL);
2842e86b9096SDag-Erling Smørgrav 		}
2843e86b9096SDag-Erling Smørgrav 		return;
2844e86b9096SDag-Erling Smørgrav 	}
2845369c6923SCy Schubert 	if(event&UB_EV_READ
2846369c6923SCy Schubert #ifdef USE_MSG_FASTOPEN
2847369c6923SCy Schubert 		&& !(c->tcp_do_fastopen && (event&UB_EV_WRITE))
2848369c6923SCy Schubert #endif
2849369c6923SCy Schubert 		) {
2850e86b9096SDag-Erling Smørgrav 		int has_tcpq = (c->tcp_req_info != NULL);
2851369c6923SCy Schubert 		int* moreread = c->tcp_more_read_again;
2852b7579f77SDag-Erling Smørgrav 		if(!comm_point_tcp_handle_read(fd, c, 0)) {
2853b7579f77SDag-Erling Smørgrav 			reclaim_tcp_handler(c);
2854b7579f77SDag-Erling Smørgrav 			if(!c->tcp_do_close) {
2855b7579f77SDag-Erling Smørgrav 				fptr_ok(fptr_whitelist_comm_point(
2856b7579f77SDag-Erling Smørgrav 					c->callback));
2857b7579f77SDag-Erling Smørgrav 				(void)(*c->callback)(c, c->cb_arg,
2858b7579f77SDag-Erling Smørgrav 					NETEVENT_CLOSED, NULL);
2859b7579f77SDag-Erling Smørgrav 			}
2860369c6923SCy Schubert 			return;
2861b7579f77SDag-Erling Smørgrav 		}
28621838dec3SCy Schubert 		if(has_tcpq && c->tcp_req_info && c->tcp_req_info->read_again) {
28631838dec3SCy Schubert 			if(!tcp_req_info_read_again(fd, c))
28641838dec3SCy Schubert 				return;
28651838dec3SCy Schubert 		}
2866369c6923SCy Schubert 		if(moreread && *moreread)
2867369c6923SCy Schubert 			tcp_more_read_again(fd, c);
2868b7579f77SDag-Erling Smørgrav 		return;
2869b7579f77SDag-Erling Smørgrav 	}
2870e2d15004SDag-Erling Smørgrav 	if(event&UB_EV_WRITE) {
2871e86b9096SDag-Erling Smørgrav 		int has_tcpq = (c->tcp_req_info != NULL);
2872369c6923SCy Schubert 		int* morewrite = c->tcp_more_write_again;
2873b7579f77SDag-Erling Smørgrav 		if(!comm_point_tcp_handle_write(fd, c)) {
2874b7579f77SDag-Erling Smørgrav 			reclaim_tcp_handler(c);
2875b7579f77SDag-Erling Smørgrav 			if(!c->tcp_do_close) {
2876b7579f77SDag-Erling Smørgrav 				fptr_ok(fptr_whitelist_comm_point(
2877b7579f77SDag-Erling Smørgrav 					c->callback));
2878b7579f77SDag-Erling Smørgrav 				(void)(*c->callback)(c, c->cb_arg,
2879b7579f77SDag-Erling Smørgrav 					NETEVENT_CLOSED, NULL);
2880b7579f77SDag-Erling Smørgrav 			}
2881369c6923SCy Schubert 			return;
2882b7579f77SDag-Erling Smørgrav 		}
28831838dec3SCy Schubert 		if(has_tcpq && c->tcp_req_info && c->tcp_req_info->read_again) {
28841838dec3SCy Schubert 			if(!tcp_req_info_read_again(fd, c))
28851838dec3SCy Schubert 				return;
28861838dec3SCy Schubert 		}
2887369c6923SCy Schubert 		if(morewrite && *morewrite)
2888369c6923SCy Schubert 			tcp_more_write_again(fd, c);
2889b7579f77SDag-Erling Smørgrav 		return;
2890b7579f77SDag-Erling Smørgrav 	}
2891b7579f77SDag-Erling Smørgrav 	log_err("Ignored event %d for tcphdl.", event);
2892b7579f77SDag-Erling Smørgrav }
2893b7579f77SDag-Erling Smørgrav 
289457bddd21SDag-Erling Smørgrav /** Make http handler free for next assignment */
289557bddd21SDag-Erling Smørgrav static void
289657bddd21SDag-Erling Smørgrav reclaim_http_handler(struct comm_point* c)
289757bddd21SDag-Erling Smørgrav {
289857bddd21SDag-Erling Smørgrav 	log_assert(c->type == comm_http);
289957bddd21SDag-Erling Smørgrav 	if(c->ssl) {
290057bddd21SDag-Erling Smørgrav #ifdef HAVE_SSL
290157bddd21SDag-Erling Smørgrav 		SSL_shutdown(c->ssl);
290257bddd21SDag-Erling Smørgrav 		SSL_free(c->ssl);
290357bddd21SDag-Erling Smørgrav 		c->ssl = NULL;
290457bddd21SDag-Erling Smørgrav #endif
290557bddd21SDag-Erling Smørgrav 	}
290657bddd21SDag-Erling Smørgrav 	comm_point_close(c);
290757bddd21SDag-Erling Smørgrav 	if(c->tcp_parent) {
290824e36522SCy Schubert 		if(c != c->tcp_parent->tcp_free) {
290957bddd21SDag-Erling Smørgrav 			c->tcp_parent->cur_tcp_count--;
291057bddd21SDag-Erling Smørgrav 			c->tcp_free = c->tcp_parent->tcp_free;
291157bddd21SDag-Erling Smørgrav 			c->tcp_parent->tcp_free = c;
291224e36522SCy Schubert 		}
291357bddd21SDag-Erling Smørgrav 		if(!c->tcp_free) {
291457bddd21SDag-Erling Smørgrav 			/* re-enable listening on accept socket */
291557bddd21SDag-Erling Smørgrav 			comm_point_start_listening(c->tcp_parent, -1, -1);
291657bddd21SDag-Erling Smørgrav 		}
291757bddd21SDag-Erling Smørgrav 	}
291857bddd21SDag-Erling Smørgrav }
291957bddd21SDag-Erling Smørgrav 
/**
 * Read more data for http (with ssl).
 * Reads with SSL_read into the space remaining in c->buffer and moves
 * the buffer position past the bytes that were read.
 * @param c: comm point; c->buffer must have space remaining.
 * @return 1 when data was read or when the read has to be retried later,
 *	0 on shutdown or on error. Without HAVE_SSL it always returns 0.
 */
static int
ssl_http_read_more(struct comm_point* c)
{
#ifdef HAVE_SSL
	int r, want;
	log_assert(sldns_buffer_remaining(c->buffer) > 0);
	ERR_clear_error();
	r = SSL_read(c->ssl, (void*)sldns_buffer_current(c->buffer),
		(int)sldns_buffer_remaining(c->buffer));
	if(r > 0) {
		verbose(VERB_ALGO, "ssl http read more skip to %d + %d",
			(int)sldns_buffer_position(c->buffer), (int)r);
		sldns_buffer_skip(c->buffer, (ssize_t)r);
		return 1;
	}

	want = SSL_get_error(c->ssl, r);
	switch(want) {
	case SSL_ERROR_ZERO_RETURN:
		return 0; /* shutdown, closed */
	case SSL_ERROR_WANT_READ:
		return 1; /* read more later */
	case SSL_ERROR_WANT_WRITE:
		/* the ssl layer needs to write first; note that in the
		 * shake state and listen for write events */
		c->ssl_shake_state = comm_ssl_shake_hs_write;
		comm_point_listen_for_rw(c, 0, 1);
		return 1;
	case SSL_ERROR_SYSCALL:
#ifdef ECONNRESET
		if(errno == ECONNRESET && verbosity < 2)
			return 0; /* silence reset by peer */
#endif
		if(errno != 0)
			log_err("SSL_read syscall: %s",
				strerror(errno));
		return 0;
	default:
		break;
	}
	log_crypto_err_io("could not SSL_read", want);
	return 0;
#else
	(void)c;
	return 0;
#endif /* HAVE_SSL */
}
296257bddd21SDag-Erling Smørgrav 
296357bddd21SDag-Erling Smørgrav /** read more data for http */
296457bddd21SDag-Erling Smørgrav static int
296557bddd21SDag-Erling Smørgrav http_read_more(int fd, struct comm_point* c)
296657bddd21SDag-Erling Smørgrav {
296757bddd21SDag-Erling Smørgrav 	ssize_t r;
296857bddd21SDag-Erling Smørgrav 	log_assert(sldns_buffer_remaining(c->buffer) > 0);
296957bddd21SDag-Erling Smørgrav 	r = recv(fd, (void*)sldns_buffer_current(c->buffer),
2970865f46b2SCy Schubert 		sldns_buffer_remaining(c->buffer), MSG_DONTWAIT);
297157bddd21SDag-Erling Smørgrav 	if(r == 0) {
297257bddd21SDag-Erling Smørgrav 		return 0;
297357bddd21SDag-Erling Smørgrav 	} else if(r == -1) {
297457bddd21SDag-Erling Smørgrav #ifndef USE_WINSOCK
297557bddd21SDag-Erling Smørgrav 		if(errno == EINTR || errno == EAGAIN)
297657bddd21SDag-Erling Smørgrav 			return 1;
297757bddd21SDag-Erling Smørgrav #else /* USE_WINSOCK */
297857bddd21SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAECONNRESET)
297957bddd21SDag-Erling Smørgrav 			return 0;
298057bddd21SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAEINPROGRESS)
298157bddd21SDag-Erling Smørgrav 			return 1;
298257bddd21SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAEWOULDBLOCK) {
298357bddd21SDag-Erling Smørgrav 			ub_winsock_tcp_wouldblock(c->ev->ev, UB_EV_READ);
298457bddd21SDag-Erling Smørgrav 			return 1;
298557bddd21SDag-Erling Smørgrav 		}
298657bddd21SDag-Erling Smørgrav #endif
2987c0caa2e2SCy Schubert 		log_err_addr("read (in http r)", sock_strerror(errno),
2988865f46b2SCy Schubert 			&c->repinfo.remote_addr, c->repinfo.remote_addrlen);
298957bddd21SDag-Erling Smørgrav 		return 0;
299057bddd21SDag-Erling Smørgrav 	}
29915469a995SCy Schubert 	verbose(VERB_ALGO, "http read more skip to %d + %d",
29925469a995SCy Schubert 		(int)sldns_buffer_position(c->buffer), (int)r);
299357bddd21SDag-Erling Smørgrav 	sldns_buffer_skip(c->buffer, r);
299457bddd21SDag-Erling Smørgrav 	return 1;
299557bddd21SDag-Erling Smørgrav }
299657bddd21SDag-Erling Smørgrav 
299757bddd21SDag-Erling Smørgrav /** return true if http header has been read (one line complete) */
299857bddd21SDag-Erling Smørgrav static int
299957bddd21SDag-Erling Smørgrav http_header_done(sldns_buffer* buf)
300057bddd21SDag-Erling Smørgrav {
300157bddd21SDag-Erling Smørgrav 	size_t i;
300257bddd21SDag-Erling Smørgrav 	for(i=sldns_buffer_position(buf); i<sldns_buffer_limit(buf); i++) {
300357bddd21SDag-Erling Smørgrav 		/* there was a \r before the \n, but we ignore that */
300457bddd21SDag-Erling Smørgrav 		if((char)sldns_buffer_read_u8_at(buf, i) == '\n')
300557bddd21SDag-Erling Smørgrav 			return 1;
300657bddd21SDag-Erling Smørgrav 	}
300757bddd21SDag-Erling Smørgrav 	return 0;
300857bddd21SDag-Erling Smørgrav }
300957bddd21SDag-Erling Smørgrav 
301057bddd21SDag-Erling Smørgrav /** return character string into buffer for header line, moves buffer
301157bddd21SDag-Erling Smørgrav  * past that line and puts zero terminator into linefeed-newline */
301257bddd21SDag-Erling Smørgrav static char*
301357bddd21SDag-Erling Smørgrav http_header_line(sldns_buffer* buf)
301457bddd21SDag-Erling Smørgrav {
301557bddd21SDag-Erling Smørgrav 	char* result = (char*)sldns_buffer_current(buf);
301657bddd21SDag-Erling Smørgrav 	size_t i;
301757bddd21SDag-Erling Smørgrav 	for(i=sldns_buffer_position(buf); i<sldns_buffer_limit(buf); i++) {
301857bddd21SDag-Erling Smørgrav 		/* terminate the string on the \r */
301957bddd21SDag-Erling Smørgrav 		if((char)sldns_buffer_read_u8_at(buf, i) == '\r')
302057bddd21SDag-Erling Smørgrav 			sldns_buffer_write_u8_at(buf, i, 0);
302157bddd21SDag-Erling Smørgrav 		/* terminate on the \n and skip past the it and done */
302257bddd21SDag-Erling Smørgrav 		if((char)sldns_buffer_read_u8_at(buf, i) == '\n') {
302357bddd21SDag-Erling Smørgrav 			sldns_buffer_write_u8_at(buf, i, 0);
302457bddd21SDag-Erling Smørgrav 			sldns_buffer_set_position(buf, i+1);
302557bddd21SDag-Erling Smørgrav 			return result;
302657bddd21SDag-Erling Smørgrav 		}
302757bddd21SDag-Erling Smørgrav 	}
302857bddd21SDag-Erling Smørgrav 	return NULL;
302957bddd21SDag-Erling Smørgrav }
303057bddd21SDag-Erling Smørgrav 
303157bddd21SDag-Erling Smørgrav /** move unread buffer to start and clear rest for putting the rest into it */
303257bddd21SDag-Erling Smørgrav static void
303357bddd21SDag-Erling Smørgrav http_moveover_buffer(sldns_buffer* buf)
303457bddd21SDag-Erling Smørgrav {
303557bddd21SDag-Erling Smørgrav 	size_t pos = sldns_buffer_position(buf);
303657bddd21SDag-Erling Smørgrav 	size_t len = sldns_buffer_remaining(buf);
303757bddd21SDag-Erling Smørgrav 	sldns_buffer_clear(buf);
303857bddd21SDag-Erling Smørgrav 	memmove(sldns_buffer_begin(buf), sldns_buffer_at(buf, pos), len);
303957bddd21SDag-Erling Smørgrav 	sldns_buffer_set_position(buf, len);
304057bddd21SDag-Erling Smørgrav }
304157bddd21SDag-Erling Smørgrav 
304257bddd21SDag-Erling Smørgrav /** a http header is complete, process it */
304357bddd21SDag-Erling Smørgrav static int
304457bddd21SDag-Erling Smørgrav http_process_initial_header(struct comm_point* c)
304557bddd21SDag-Erling Smørgrav {
304657bddd21SDag-Erling Smørgrav 	char* line = http_header_line(c->buffer);
304757bddd21SDag-Erling Smørgrav 	if(!line) return 1;
304857bddd21SDag-Erling Smørgrav 	verbose(VERB_ALGO, "http header: %s", line);
304957bddd21SDag-Erling Smørgrav 	if(strncasecmp(line, "HTTP/1.1 ", 9) == 0) {
305057bddd21SDag-Erling Smørgrav 		/* check returncode */
305157bddd21SDag-Erling Smørgrav 		if(line[9] != '2') {
305257bddd21SDag-Erling Smørgrav 			verbose(VERB_ALGO, "http bad status %s", line+9);
305357bddd21SDag-Erling Smørgrav 			return 0;
305457bddd21SDag-Erling Smørgrav 		}
305557bddd21SDag-Erling Smørgrav 	} else if(strncasecmp(line, "Content-Length: ", 16) == 0) {
305657bddd21SDag-Erling Smørgrav 		if(!c->http_is_chunked)
305757bddd21SDag-Erling Smørgrav 			c->tcp_byte_count = (size_t)atoi(line+16);
305857bddd21SDag-Erling Smørgrav 	} else if(strncasecmp(line, "Transfer-Encoding: chunked", 19+7) == 0) {
305957bddd21SDag-Erling Smørgrav 		c->tcp_byte_count = 0;
306057bddd21SDag-Erling Smørgrav 		c->http_is_chunked = 1;
306157bddd21SDag-Erling Smørgrav 	} else if(line[0] == 0) {
306257bddd21SDag-Erling Smørgrav 		/* end of initial headers */
306357bddd21SDag-Erling Smørgrav 		c->http_in_headers = 0;
306457bddd21SDag-Erling Smørgrav 		if(c->http_is_chunked)
306557bddd21SDag-Erling Smørgrav 			c->http_in_chunk_headers = 1;
306657bddd21SDag-Erling Smørgrav 		/* remove header text from front of buffer
306757bddd21SDag-Erling Smørgrav 		 * the buffer is going to be used to return the data segment
306857bddd21SDag-Erling Smørgrav 		 * itself and we don't want the header to get returned
306957bddd21SDag-Erling Smørgrav 		 * prepended with it */
307057bddd21SDag-Erling Smørgrav 		http_moveover_buffer(c->buffer);
307157bddd21SDag-Erling Smørgrav 		sldns_buffer_flip(c->buffer);
307257bddd21SDag-Erling Smørgrav 		return 1;
307357bddd21SDag-Erling Smørgrav 	}
307457bddd21SDag-Erling Smørgrav 	/* ignore other headers */
307557bddd21SDag-Erling Smørgrav 	return 1;
307657bddd21SDag-Erling Smørgrav }
307757bddd21SDag-Erling Smørgrav 
307857bddd21SDag-Erling Smørgrav /** a chunk header is complete, process it, return 0=fail, 1=continue next
307957bddd21SDag-Erling Smørgrav  * header line, 2=done with chunked transfer*/
308057bddd21SDag-Erling Smørgrav static int
308157bddd21SDag-Erling Smørgrav http_process_chunk_header(struct comm_point* c)
308257bddd21SDag-Erling Smørgrav {
308357bddd21SDag-Erling Smørgrav 	char* line = http_header_line(c->buffer);
308457bddd21SDag-Erling Smørgrav 	if(!line) return 1;
308557bddd21SDag-Erling Smørgrav 	if(c->http_in_chunk_headers == 3) {
308657bddd21SDag-Erling Smørgrav 		verbose(VERB_ALGO, "http chunk trailer: %s", line);
308757bddd21SDag-Erling Smørgrav 		/* are we done ? */
308857bddd21SDag-Erling Smørgrav 		if(line[0] == 0 && c->tcp_byte_count == 0) {
308957bddd21SDag-Erling Smørgrav 			/* callback of http reader when NETEVENT_DONE,
309057bddd21SDag-Erling Smørgrav 			 * end of data, with no data in buffer */
309157bddd21SDag-Erling Smørgrav 			sldns_buffer_set_position(c->buffer, 0);
309257bddd21SDag-Erling Smørgrav 			sldns_buffer_set_limit(c->buffer, 0);
309357bddd21SDag-Erling Smørgrav 			fptr_ok(fptr_whitelist_comm_point(c->callback));
309457bddd21SDag-Erling Smørgrav 			(void)(*c->callback)(c, c->cb_arg, NETEVENT_DONE, NULL);
309557bddd21SDag-Erling Smørgrav 			/* return that we are done */
309657bddd21SDag-Erling Smørgrav 			return 2;
309757bddd21SDag-Erling Smørgrav 		}
309857bddd21SDag-Erling Smørgrav 		if(line[0] == 0) {
309957bddd21SDag-Erling Smørgrav 			/* continue with header of the next chunk */
310057bddd21SDag-Erling Smørgrav 			c->http_in_chunk_headers = 1;
310157bddd21SDag-Erling Smørgrav 			/* remove header text from front of buffer */
310257bddd21SDag-Erling Smørgrav 			http_moveover_buffer(c->buffer);
310357bddd21SDag-Erling Smørgrav 			sldns_buffer_flip(c->buffer);
310457bddd21SDag-Erling Smørgrav 			return 1;
310557bddd21SDag-Erling Smørgrav 		}
310657bddd21SDag-Erling Smørgrav 		/* ignore further trail headers */
310757bddd21SDag-Erling Smørgrav 		return 1;
310857bddd21SDag-Erling Smørgrav 	}
310957bddd21SDag-Erling Smørgrav 	verbose(VERB_ALGO, "http chunk header: %s", line);
311057bddd21SDag-Erling Smørgrav 	if(c->http_in_chunk_headers == 1) {
311157bddd21SDag-Erling Smørgrav 		/* read chunked start line */
311257bddd21SDag-Erling Smørgrav 		char* end = NULL;
311357bddd21SDag-Erling Smørgrav 		c->tcp_byte_count = (size_t)strtol(line, &end, 16);
311457bddd21SDag-Erling Smørgrav 		if(end == line)
311557bddd21SDag-Erling Smørgrav 			return 0;
311657bddd21SDag-Erling Smørgrav 		c->http_in_chunk_headers = 0;
311757bddd21SDag-Erling Smørgrav 		/* remove header text from front of buffer */
311857bddd21SDag-Erling Smørgrav 		http_moveover_buffer(c->buffer);
311957bddd21SDag-Erling Smørgrav 		sldns_buffer_flip(c->buffer);
312057bddd21SDag-Erling Smørgrav 		if(c->tcp_byte_count == 0) {
312157bddd21SDag-Erling Smørgrav 			/* done with chunks, process chunk_trailer lines */
312257bddd21SDag-Erling Smørgrav 			c->http_in_chunk_headers = 3;
312357bddd21SDag-Erling Smørgrav 		}
312457bddd21SDag-Erling Smørgrav 		return 1;
312557bddd21SDag-Erling Smørgrav 	}
312657bddd21SDag-Erling Smørgrav 	/* ignore other headers */
312757bddd21SDag-Erling Smørgrav 	return 1;
312857bddd21SDag-Erling Smørgrav }
312957bddd21SDag-Erling Smørgrav 
31305469a995SCy Schubert /** handle nonchunked data segment, 0=fail, 1=wait */
313157bddd21SDag-Erling Smørgrav static int
313257bddd21SDag-Erling Smørgrav http_nonchunk_segment(struct comm_point* c)
313357bddd21SDag-Erling Smørgrav {
313457bddd21SDag-Erling Smørgrav 	/* c->buffer at position..limit has new data we read in.
313557bddd21SDag-Erling Smørgrav 	 * the buffer itself is full of nonchunked data.
313657bddd21SDag-Erling Smørgrav 	 * we are looking to read tcp_byte_count more data
313757bddd21SDag-Erling Smørgrav 	 * and then the transfer is done. */
313857bddd21SDag-Erling Smørgrav 	size_t remainbufferlen;
31395469a995SCy Schubert 	size_t got_now = sldns_buffer_limit(c->buffer);
314057bddd21SDag-Erling Smørgrav 	if(c->tcp_byte_count <= got_now) {
314157bddd21SDag-Erling Smørgrav 		/* done, this is the last data fragment */
314257bddd21SDag-Erling Smørgrav 		c->http_stored = 0;
314357bddd21SDag-Erling Smørgrav 		sldns_buffer_set_position(c->buffer, 0);
314457bddd21SDag-Erling Smørgrav 		fptr_ok(fptr_whitelist_comm_point(c->callback));
314557bddd21SDag-Erling Smørgrav 		(void)(*c->callback)(c, c->cb_arg, NETEVENT_DONE, NULL);
314657bddd21SDag-Erling Smørgrav 		return 1;
314757bddd21SDag-Erling Smørgrav 	}
314857bddd21SDag-Erling Smørgrav 	/* if we have the buffer space,
314957bddd21SDag-Erling Smørgrav 	 * read more data collected into the buffer */
315057bddd21SDag-Erling Smørgrav 	remainbufferlen = sldns_buffer_capacity(c->buffer) -
315157bddd21SDag-Erling Smørgrav 		sldns_buffer_limit(c->buffer);
31525469a995SCy Schubert 	if(remainbufferlen+got_now >= c->tcp_byte_count ||
3153a39a5a69SCy Schubert 		remainbufferlen >= (size_t)(c->ssl?16384:2048)) {
315457bddd21SDag-Erling Smørgrav 		size_t total = sldns_buffer_limit(c->buffer);
315557bddd21SDag-Erling Smørgrav 		sldns_buffer_clear(c->buffer);
315657bddd21SDag-Erling Smørgrav 		sldns_buffer_set_position(c->buffer, total);
315757bddd21SDag-Erling Smørgrav 		c->http_stored = total;
315857bddd21SDag-Erling Smørgrav 		/* return and wait to read more */
315957bddd21SDag-Erling Smørgrav 		return 1;
316057bddd21SDag-Erling Smørgrav 	}
316157bddd21SDag-Erling Smørgrav 	/* call callback with this data amount, then
316257bddd21SDag-Erling Smørgrav 	 * wait for more */
31635469a995SCy Schubert 	c->tcp_byte_count -= got_now;
316457bddd21SDag-Erling Smørgrav 	c->http_stored = 0;
316557bddd21SDag-Erling Smørgrav 	sldns_buffer_set_position(c->buffer, 0);
316657bddd21SDag-Erling Smørgrav 	fptr_ok(fptr_whitelist_comm_point(c->callback));
316757bddd21SDag-Erling Smørgrav 	(void)(*c->callback)(c, c->cb_arg, NETEVENT_NOERROR, NULL);
316857bddd21SDag-Erling Smørgrav 	/* c->callback has to buffer_clear(c->buffer). */
316957bddd21SDag-Erling Smørgrav 	/* return and wait to read more */
317057bddd21SDag-Erling Smørgrav 	return 1;
317157bddd21SDag-Erling Smørgrav }
317257bddd21SDag-Erling Smørgrav 
3173f44e67d1SCy Schubert /** handle chunked data segment, return 0=fail, 1=wait, 2=process more */
317457bddd21SDag-Erling Smørgrav static int
317557bddd21SDag-Erling Smørgrav http_chunked_segment(struct comm_point* c)
317657bddd21SDag-Erling Smørgrav {
317757bddd21SDag-Erling Smørgrav 	/* the c->buffer has from position..limit new data we read. */
317857bddd21SDag-Erling Smørgrav 	/* the current chunk has length tcp_byte_count.
317957bddd21SDag-Erling Smørgrav 	 * once we read that read more chunk headers.
318057bddd21SDag-Erling Smørgrav 	 */
318157bddd21SDag-Erling Smørgrav 	size_t remainbufferlen;
318257bddd21SDag-Erling Smørgrav 	size_t got_now = sldns_buffer_limit(c->buffer) - c->http_stored;
3183f44e67d1SCy Schubert 	verbose(VERB_ALGO, "http_chunked_segment: got now %d, tcpbytcount %d, http_stored %d, buffer pos %d, buffer limit %d", (int)got_now, (int)c->tcp_byte_count, (int)c->http_stored, (int)sldns_buffer_position(c->buffer), (int)sldns_buffer_limit(c->buffer));
318457bddd21SDag-Erling Smørgrav 	if(c->tcp_byte_count <= got_now) {
318557bddd21SDag-Erling Smørgrav 		/* the chunk has completed (with perhaps some extra data
318657bddd21SDag-Erling Smørgrav 		 * from next chunk header and next chunk) */
318757bddd21SDag-Erling Smørgrav 		/* save too much info into temp buffer */
318857bddd21SDag-Erling Smørgrav 		size_t fraglen;
318957bddd21SDag-Erling Smørgrav 		struct comm_reply repinfo;
319057bddd21SDag-Erling Smørgrav 		c->http_stored = 0;
319157bddd21SDag-Erling Smørgrav 		sldns_buffer_skip(c->buffer, (ssize_t)c->tcp_byte_count);
319257bddd21SDag-Erling Smørgrav 		sldns_buffer_clear(c->http_temp);
319357bddd21SDag-Erling Smørgrav 		sldns_buffer_write(c->http_temp,
319457bddd21SDag-Erling Smørgrav 			sldns_buffer_current(c->buffer),
319557bddd21SDag-Erling Smørgrav 			sldns_buffer_remaining(c->buffer));
319657bddd21SDag-Erling Smørgrav 		sldns_buffer_flip(c->http_temp);
319757bddd21SDag-Erling Smørgrav 
319857bddd21SDag-Erling Smørgrav 		/* callback with this fragment */
319957bddd21SDag-Erling Smørgrav 		fraglen = sldns_buffer_position(c->buffer);
320057bddd21SDag-Erling Smørgrav 		sldns_buffer_set_position(c->buffer, 0);
320157bddd21SDag-Erling Smørgrav 		sldns_buffer_set_limit(c->buffer, fraglen);
320257bddd21SDag-Erling Smørgrav 		repinfo = c->repinfo;
320357bddd21SDag-Erling Smørgrav 		fptr_ok(fptr_whitelist_comm_point(c->callback));
320457bddd21SDag-Erling Smørgrav 		(void)(*c->callback)(c, c->cb_arg, NETEVENT_NOERROR, &repinfo);
320557bddd21SDag-Erling Smørgrav 		/* c->callback has to buffer_clear(). */
320657bddd21SDag-Erling Smørgrav 
320757bddd21SDag-Erling Smørgrav 		/* is commpoint deleted? */
320857bddd21SDag-Erling Smørgrav 		if(!repinfo.c) {
320957bddd21SDag-Erling Smørgrav 			return 1;
321057bddd21SDag-Erling Smørgrav 		}
321157bddd21SDag-Erling Smørgrav 		/* copy waiting info */
321257bddd21SDag-Erling Smørgrav 		sldns_buffer_clear(c->buffer);
321357bddd21SDag-Erling Smørgrav 		sldns_buffer_write(c->buffer,
321457bddd21SDag-Erling Smørgrav 			sldns_buffer_begin(c->http_temp),
321557bddd21SDag-Erling Smørgrav 			sldns_buffer_remaining(c->http_temp));
321657bddd21SDag-Erling Smørgrav 		sldns_buffer_flip(c->buffer);
321757bddd21SDag-Erling Smørgrav 		/* process end of chunk trailer header lines, until
321857bddd21SDag-Erling Smørgrav 		 * an empty line */
321957bddd21SDag-Erling Smørgrav 		c->http_in_chunk_headers = 3;
322057bddd21SDag-Erling Smørgrav 		/* process more data in buffer (if any) */
322157bddd21SDag-Erling Smørgrav 		return 2;
322257bddd21SDag-Erling Smørgrav 	}
322357bddd21SDag-Erling Smørgrav 	c->tcp_byte_count -= got_now;
322457bddd21SDag-Erling Smørgrav 
322557bddd21SDag-Erling Smørgrav 	/* if we have the buffer space,
322657bddd21SDag-Erling Smørgrav 	 * read more data collected into the buffer */
322757bddd21SDag-Erling Smørgrav 	remainbufferlen = sldns_buffer_capacity(c->buffer) -
322857bddd21SDag-Erling Smørgrav 		sldns_buffer_limit(c->buffer);
322957bddd21SDag-Erling Smørgrav 	if(remainbufferlen >= c->tcp_byte_count ||
323057bddd21SDag-Erling Smørgrav 		remainbufferlen >= 2048) {
323157bddd21SDag-Erling Smørgrav 		size_t total = sldns_buffer_limit(c->buffer);
323257bddd21SDag-Erling Smørgrav 		sldns_buffer_clear(c->buffer);
323357bddd21SDag-Erling Smørgrav 		sldns_buffer_set_position(c->buffer, total);
323457bddd21SDag-Erling Smørgrav 		c->http_stored = total;
323557bddd21SDag-Erling Smørgrav 		/* return and wait to read more */
323657bddd21SDag-Erling Smørgrav 		return 1;
323757bddd21SDag-Erling Smørgrav 	}
323857bddd21SDag-Erling Smørgrav 
323957bddd21SDag-Erling Smørgrav 	/* callback of http reader for a new part of the data */
324057bddd21SDag-Erling Smørgrav 	c->http_stored = 0;
324157bddd21SDag-Erling Smørgrav 	sldns_buffer_set_position(c->buffer, 0);
324257bddd21SDag-Erling Smørgrav 	fptr_ok(fptr_whitelist_comm_point(c->callback));
324357bddd21SDag-Erling Smørgrav 	(void)(*c->callback)(c, c->cb_arg, NETEVENT_NOERROR, NULL);
324457bddd21SDag-Erling Smørgrav 	/* c->callback has to buffer_clear(c->buffer). */
324557bddd21SDag-Erling Smørgrav 	/* return and wait to read more */
324657bddd21SDag-Erling Smørgrav 	return 1;
324757bddd21SDag-Erling Smørgrav }
324857bddd21SDag-Erling Smørgrav 
3249c0caa2e2SCy Schubert #ifdef HAVE_NGHTTP2
3250c0caa2e2SCy Schubert /** Create new http2 session. Called when creating handling comm point. */
3251f44e67d1SCy Schubert static struct http2_session* http2_session_create(struct comm_point* c)
3252c0caa2e2SCy Schubert {
3253c0caa2e2SCy Schubert 	struct http2_session* session = calloc(1, sizeof(*session));
3254c0caa2e2SCy Schubert 	if(!session) {
3255c0caa2e2SCy Schubert 		log_err("malloc failure while creating http2 session");
3256c0caa2e2SCy Schubert 		return NULL;
3257c0caa2e2SCy Schubert 	}
3258c0caa2e2SCy Schubert 	session->c = c;
3259c0caa2e2SCy Schubert 
3260c0caa2e2SCy Schubert 	return session;
3261c0caa2e2SCy Schubert }
3262c0caa2e2SCy Schubert #endif
3263c0caa2e2SCy Schubert 
/**
 * Release an http2 session, after closing the connection or on error.
 * With nghttp2 support compiled in, the session's nghttp2 callbacks object
 * (when present) is deleted and the session struct is freed. Without
 * nghttp2 support this function does nothing.
 * @param h2_session: session to release.
 */
static void http2_session_delete(struct http2_session* h2_session)
{
#ifndef HAVE_NGHTTP2
	(void)h2_session;
#else
	if(h2_session->callbacks != NULL)
		nghttp2_session_callbacks_del(h2_session->callbacks);
	free(h2_session);
#endif
}
3275c0caa2e2SCy Schubert 
3276c0caa2e2SCy Schubert #ifdef HAVE_NGHTTP2
3277c0caa2e2SCy Schubert struct http2_stream* http2_stream_create(int32_t stream_id)
3278c0caa2e2SCy Schubert {
3279c0caa2e2SCy Schubert 	struct http2_stream* h2_stream = calloc(1, sizeof(*h2_stream));
3280c0caa2e2SCy Schubert 	if(!h2_stream) {
3281c0caa2e2SCy Schubert 		log_err("malloc failure while creating http2 stream");
3282c0caa2e2SCy Schubert 		return NULL;
3283c0caa2e2SCy Schubert 	}
3284c0caa2e2SCy Schubert 	h2_stream->stream_id = stream_id;
3285c0caa2e2SCy Schubert 	return h2_stream;
3286c0caa2e2SCy Schubert }
3287c0caa2e2SCy Schubert 
3288c0caa2e2SCy Schubert /** Delete http2 stream. After session delete or stream close callback */
3289c0caa2e2SCy Schubert static void http2_stream_delete(struct http2_session* h2_session,
3290c0caa2e2SCy Schubert 	struct http2_stream* h2_stream)
3291c0caa2e2SCy Schubert {
3292c0caa2e2SCy Schubert 	if(h2_stream->mesh_state) {
3293c0caa2e2SCy Schubert 		mesh_state_remove_reply(h2_stream->mesh, h2_stream->mesh_state,
3294c0caa2e2SCy Schubert 			h2_session->c);
3295c0caa2e2SCy Schubert 		h2_stream->mesh_state = NULL;
3296c0caa2e2SCy Schubert 	}
3297c0caa2e2SCy Schubert 	http2_req_stream_clear(h2_stream);
3298c0caa2e2SCy Schubert 	free(h2_stream);
3299c0caa2e2SCy Schubert }
3300c0caa2e2SCy Schubert #endif
3301c0caa2e2SCy Schubert 
3302c0caa2e2SCy Schubert void http2_stream_add_meshstate(struct http2_stream* h2_stream,
3303c0caa2e2SCy Schubert 	struct mesh_area* mesh, struct mesh_state* m)
3304c0caa2e2SCy Schubert {
3305c0caa2e2SCy Schubert 	h2_stream->mesh = mesh;
3306c0caa2e2SCy Schubert 	h2_stream->mesh_state = m;
3307c0caa2e2SCy Schubert }
3308c0caa2e2SCy Schubert 
/**
 * Delete the server side state of an http2 session, after closing the
 * connection.
 * With nghttp2 support: deletes the nghttp2 session object, deletes every
 * stream on the session's stream list, and resets the drop flags and the
 * comm point's current stream pointer. The http2_session struct itself is
 * not freed here. Without nghttp2 support this function does nothing.
 * @param h2_session: session to tear down.
 */
static void http2_session_server_delete(struct http2_session* h2_session)
{
#ifdef HAVE_NGHTTP2
	struct http2_stream* cur;

	nghttp2_session_del(h2_session->session); /* NULL input is fine */
	h2_session->session = NULL;

	cur = h2_session->first_stream;
	while(cur != NULL) {
		/* fetch the successor before the node is freed */
		struct http2_stream* following = cur->next;
		http2_stream_delete(h2_session, cur);
		cur = following;
	}
	h2_session->first_stream = NULL;
	h2_session->is_drop = 0;
	h2_session->postpone_drop = 0;
	h2_session->c->h2_stream = NULL;
#endif
	(void)h2_session;
}
3328c0caa2e2SCy Schubert 
3329c0caa2e2SCy Schubert #ifdef HAVE_NGHTTP2
3330c0caa2e2SCy Schubert void http2_session_add_stream(struct http2_session* h2_session,
3331c0caa2e2SCy Schubert 	struct http2_stream* h2_stream)
3332c0caa2e2SCy Schubert {
3333c0caa2e2SCy Schubert 	if(h2_session->first_stream)
3334c0caa2e2SCy Schubert 		h2_session->first_stream->prev = h2_stream;
3335c0caa2e2SCy Schubert 	h2_stream->next = h2_session->first_stream;
3336c0caa2e2SCy Schubert 	h2_session->first_stream = h2_stream;
3337c0caa2e2SCy Schubert }
3338c0caa2e2SCy Schubert 
3339c0caa2e2SCy Schubert /** remove stream from session linked list. After stream close callback or
3340c0caa2e2SCy Schubert  * closing connection */
3341f44e67d1SCy Schubert static void http2_session_remove_stream(struct http2_session* h2_session,
3342c0caa2e2SCy Schubert 	struct http2_stream* h2_stream)
3343c0caa2e2SCy Schubert {
3344c0caa2e2SCy Schubert 	if(h2_stream->prev)
3345c0caa2e2SCy Schubert 		h2_stream->prev->next = h2_stream->next;
3346c0caa2e2SCy Schubert 	else
3347c0caa2e2SCy Schubert 		h2_session->first_stream = h2_stream->next;
3348c0caa2e2SCy Schubert 	if(h2_stream->next)
3349c0caa2e2SCy Schubert 		h2_stream->next->prev = h2_stream->prev;
3350c0caa2e2SCy Schubert 
3351c0caa2e2SCy Schubert }
3352c0caa2e2SCy Schubert 
3353c0caa2e2SCy Schubert int http2_stream_close_cb(nghttp2_session* ATTR_UNUSED(session),
3354c0caa2e2SCy Schubert 	int32_t stream_id, uint32_t ATTR_UNUSED(error_code), void* cb_arg)
3355c0caa2e2SCy Schubert {
3356c0caa2e2SCy Schubert 	struct http2_stream* h2_stream;
3357c0caa2e2SCy Schubert 	struct http2_session* h2_session = (struct http2_session*)cb_arg;
3358c0caa2e2SCy Schubert 	if(!(h2_stream = nghttp2_session_get_stream_user_data(
3359c0caa2e2SCy Schubert 		h2_session->session, stream_id))) {
3360c0caa2e2SCy Schubert 		return 0;
3361c0caa2e2SCy Schubert 	}
3362c0caa2e2SCy Schubert 	http2_session_remove_stream(h2_session, h2_stream);
3363c0caa2e2SCy Schubert 	http2_stream_delete(h2_session, h2_stream);
3364c0caa2e2SCy Schubert 	return 0;
3365c0caa2e2SCy Schubert }
3366c0caa2e2SCy Schubert 
3367c0caa2e2SCy Schubert ssize_t http2_recv_cb(nghttp2_session* ATTR_UNUSED(session), uint8_t* buf,
3368c0caa2e2SCy Schubert 	size_t len, int ATTR_UNUSED(flags), void* cb_arg)
3369c0caa2e2SCy Schubert {
3370c0caa2e2SCy Schubert 	struct http2_session* h2_session = (struct http2_session*)cb_arg;
3371369c6923SCy Schubert 	ssize_t ret;
3372c0caa2e2SCy Schubert 
3373c0caa2e2SCy Schubert 	log_assert(h2_session->c->type == comm_http);
3374c0caa2e2SCy Schubert 	log_assert(h2_session->c->h2_session);
3375c0caa2e2SCy Schubert 
3376369c6923SCy Schubert #ifdef HAVE_SSL
3377369c6923SCy Schubert 	if(h2_session->c->ssl) {
3378369c6923SCy Schubert 		int r;
3379c0caa2e2SCy Schubert 		ERR_clear_error();
3380c0caa2e2SCy Schubert 		r = SSL_read(h2_session->c->ssl, buf, len);
3381c0caa2e2SCy Schubert 		if(r <= 0) {
3382c0caa2e2SCy Schubert 			int want = SSL_get_error(h2_session->c->ssl, r);
3383c0caa2e2SCy Schubert 			if(want == SSL_ERROR_ZERO_RETURN) {
3384c0caa2e2SCy Schubert 				return NGHTTP2_ERR_EOF;
3385c0caa2e2SCy Schubert 			} else if(want == SSL_ERROR_WANT_READ) {
3386c0caa2e2SCy Schubert 				return NGHTTP2_ERR_WOULDBLOCK;
3387c0caa2e2SCy Schubert 			} else if(want == SSL_ERROR_WANT_WRITE) {
3388c0caa2e2SCy Schubert 				h2_session->c->ssl_shake_state = comm_ssl_shake_hs_write;
3389c0caa2e2SCy Schubert 				comm_point_listen_for_rw(h2_session->c, 0, 1);
3390c0caa2e2SCy Schubert 				return NGHTTP2_ERR_WOULDBLOCK;
3391c0caa2e2SCy Schubert 			} else if(want == SSL_ERROR_SYSCALL) {
3392c0caa2e2SCy Schubert #ifdef ECONNRESET
3393c0caa2e2SCy Schubert 				if(errno == ECONNRESET && verbosity < 2)
3394c0caa2e2SCy Schubert 					return NGHTTP2_ERR_CALLBACK_FAILURE;
3395c0caa2e2SCy Schubert #endif
3396c0caa2e2SCy Schubert 				if(errno != 0)
3397c0caa2e2SCy Schubert 					log_err("SSL_read syscall: %s",
3398c0caa2e2SCy Schubert 						strerror(errno));
3399c0caa2e2SCy Schubert 				return NGHTTP2_ERR_CALLBACK_FAILURE;
3400c0caa2e2SCy Schubert 			}
3401103ba509SCy Schubert 			log_crypto_err_io("could not SSL_read", want);
3402c0caa2e2SCy Schubert 			return NGHTTP2_ERR_CALLBACK_FAILURE;
3403c0caa2e2SCy Schubert 		}
3404c0caa2e2SCy Schubert 		return r;
3405369c6923SCy Schubert 	}
3406369c6923SCy Schubert #endif /* HAVE_SSL */
3407369c6923SCy Schubert 
3408865f46b2SCy Schubert 	ret = recv(h2_session->c->fd, buf, len, MSG_DONTWAIT);
3409369c6923SCy Schubert 	if(ret == 0) {
3410369c6923SCy Schubert 		return NGHTTP2_ERR_EOF;
3411369c6923SCy Schubert 	} else if(ret < 0) {
3412369c6923SCy Schubert #ifndef USE_WINSOCK
3413369c6923SCy Schubert 		if(errno == EINTR || errno == EAGAIN)
3414369c6923SCy Schubert 			return NGHTTP2_ERR_WOULDBLOCK;
3415369c6923SCy Schubert #ifdef ECONNRESET
3416369c6923SCy Schubert 		if(errno == ECONNRESET && verbosity < 2)
3417369c6923SCy Schubert 			return NGHTTP2_ERR_CALLBACK_FAILURE;
3418c0caa2e2SCy Schubert #endif
3419369c6923SCy Schubert 		log_err_addr("could not http2 recv: %s", strerror(errno),
3420865f46b2SCy Schubert 			&h2_session->c->repinfo.remote_addr,
3421865f46b2SCy Schubert 			h2_session->c->repinfo.remote_addrlen);
3422369c6923SCy Schubert #else /* USE_WINSOCK */
3423369c6923SCy Schubert 		if(WSAGetLastError() == WSAECONNRESET)
3424369c6923SCy Schubert 			return NGHTTP2_ERR_CALLBACK_FAILURE;
3425369c6923SCy Schubert 		if(WSAGetLastError() == WSAEINPROGRESS)
3426369c6923SCy Schubert 			return NGHTTP2_ERR_WOULDBLOCK;
3427369c6923SCy Schubert 		if(WSAGetLastError() == WSAEWOULDBLOCK) {
3428369c6923SCy Schubert 			ub_winsock_tcp_wouldblock(h2_session->c->ev->ev,
3429369c6923SCy Schubert 				UB_EV_READ);
3430369c6923SCy Schubert 			return NGHTTP2_ERR_WOULDBLOCK;
3431369c6923SCy Schubert 		}
3432369c6923SCy Schubert 		log_err_addr("could not http2 recv: %s",
3433369c6923SCy Schubert 			wsa_strerror(WSAGetLastError()),
3434865f46b2SCy Schubert 			&h2_session->c->repinfo.remote_addr,
3435865f46b2SCy Schubert 			h2_session->c->repinfo.remote_addrlen);
3436369c6923SCy Schubert #endif
3437369c6923SCy Schubert 		return NGHTTP2_ERR_CALLBACK_FAILURE;
3438369c6923SCy Schubert 	}
3439369c6923SCy Schubert 	return ret;
3440c0caa2e2SCy Schubert }
3441c0caa2e2SCy Schubert #endif /* HAVE_NGHTTP2 */
3442c0caa2e2SCy Schubert 
/**
 * Handle http2 read.
 * Lets nghttp2 consume incoming data, then decides what the comm point
 * should wait for next.
 * @param c: comm point with an http2 session.
 * @return 0 when nghttp2 reported an error, when the session wants neither
 *	to write nor to read (connection can be closed), or when nghttp2
 *	support is not compiled in; 1 otherwise.
 */
static int
comm_point_http2_handle_read(int ATTR_UNUSED(fd), struct comm_point* c)
{
#ifdef HAVE_NGHTTP2
	int rv;
	log_assert(c->h2_session);

	/* reading until recv cb returns NGHTTP2_ERR_WOULDBLOCK */
	rv = nghttp2_session_recv(c->h2_session->session);
	if(rv != 0) {
		/* EOF and callback failures are not reported here */
		if(rv != NGHTTP2_ERR_EOF &&
			rv != NGHTTP2_ERR_CALLBACK_FAILURE) {
			char peer[256];
			addr_to_str(&c->repinfo.remote_addr,
				c->repinfo.remote_addrlen, peer, sizeof(peer));
			verbose(VERB_QUERY, "http2: session_recv from %s failed, "
				"error: %s", peer, nghttp2_strerror(rv));
		}
		return 0;
	}

	if(!nghttp2_session_want_write(c->h2_session->session)) {
		if(!nghttp2_session_want_read(c->h2_session->session))
			return 0; /* connection can be closed */
		return 1;
	}

	/* nghttp2 has output pending: switch the comm point to writing */
	c->tcp_is_reading = 0;
	comm_point_stop_listening(c);
	comm_point_start_listening(c, -1, adjusted_tcp_timeout(c));
	return 1;
#else
	(void)c;
	return 0;
#endif
}
3476c0caa2e2SCy Schubert 
347757bddd21SDag-Erling Smørgrav /**
347857bddd21SDag-Erling Smørgrav  * Handle http reading callback.
347957bddd21SDag-Erling Smørgrav  * @param fd: file descriptor of socket.
348057bddd21SDag-Erling Smørgrav  * @param c: comm point to read from into buffer.
348157bddd21SDag-Erling Smørgrav  * @return: 0 on error
348257bddd21SDag-Erling Smørgrav  */
348357bddd21SDag-Erling Smørgrav static int
348457bddd21SDag-Erling Smørgrav comm_point_http_handle_read(int fd, struct comm_point* c)
348557bddd21SDag-Erling Smørgrav {
348657bddd21SDag-Erling Smørgrav 	log_assert(c->type == comm_http);
348757bddd21SDag-Erling Smørgrav 	log_assert(fd != -1);
348857bddd21SDag-Erling Smørgrav 
348957bddd21SDag-Erling Smørgrav 	/* if we are in ssl handshake, handle SSL handshake */
349057bddd21SDag-Erling Smørgrav #ifdef HAVE_SSL
349157bddd21SDag-Erling Smørgrav 	if(c->ssl && c->ssl_shake_state != comm_ssl_shake_none) {
349257bddd21SDag-Erling Smørgrav 		if(!ssl_handshake(c))
349357bddd21SDag-Erling Smørgrav 			return 0;
349457bddd21SDag-Erling Smørgrav 		if(c->ssl_shake_state != comm_ssl_shake_none)
349557bddd21SDag-Erling Smørgrav 			return 1;
349657bddd21SDag-Erling Smørgrav 	}
349757bddd21SDag-Erling Smørgrav #endif /* HAVE_SSL */
349857bddd21SDag-Erling Smørgrav 
349957bddd21SDag-Erling Smørgrav 	if(!c->tcp_is_reading)
350057bddd21SDag-Erling Smørgrav 		return 1;
3501c0caa2e2SCy Schubert 
3502c0caa2e2SCy Schubert 	if(c->use_h2) {
3503c0caa2e2SCy Schubert 		return comm_point_http2_handle_read(fd, c);
3504c0caa2e2SCy Schubert 	}
3505c0caa2e2SCy Schubert 
3506c0caa2e2SCy Schubert 	/* http version is <= http/1.1 */
3507c0caa2e2SCy Schubert 
3508c0caa2e2SCy Schubert 	if(c->http_min_version >= http_version_2) {
3509c0caa2e2SCy Schubert 		/* HTTP/2 failed, not allowed to use lower version. */
3510c0caa2e2SCy Schubert 		return 0;
3511c0caa2e2SCy Schubert 	}
3512c0caa2e2SCy Schubert 
351357bddd21SDag-Erling Smørgrav 	/* read more data */
351457bddd21SDag-Erling Smørgrav 	if(c->ssl) {
351557bddd21SDag-Erling Smørgrav 		if(!ssl_http_read_more(c))
351657bddd21SDag-Erling Smørgrav 			return 0;
351757bddd21SDag-Erling Smørgrav 	} else {
351857bddd21SDag-Erling Smørgrav 		if(!http_read_more(fd, c))
351957bddd21SDag-Erling Smørgrav 			return 0;
352057bddd21SDag-Erling Smørgrav 	}
352157bddd21SDag-Erling Smørgrav 
35225469a995SCy Schubert 	if(c->http_stored >= sldns_buffer_position(c->buffer)) {
35235469a995SCy Schubert 		/* read did not work but we wanted more data, there is
35245469a995SCy Schubert 		 * no bytes to process now. */
35255469a995SCy Schubert 		return 1;
35265469a995SCy Schubert 	}
352757bddd21SDag-Erling Smørgrav 	sldns_buffer_flip(c->buffer);
3528f44e67d1SCy Schubert 	/* if we are partway in a segment of data, position us at the point
3529f44e67d1SCy Schubert 	 * where we left off previously */
3530f44e67d1SCy Schubert 	if(c->http_stored < sldns_buffer_limit(c->buffer))
3531f44e67d1SCy Schubert 		sldns_buffer_set_position(c->buffer, c->http_stored);
3532f44e67d1SCy Schubert 	else	sldns_buffer_set_position(c->buffer, sldns_buffer_limit(c->buffer));
3533c0caa2e2SCy Schubert 
353457bddd21SDag-Erling Smørgrav 	while(sldns_buffer_remaining(c->buffer) > 0) {
3535c0caa2e2SCy Schubert 		/* Handle HTTP/1.x data */
353657bddd21SDag-Erling Smørgrav 		/* if we are reading headers, read more headers */
353757bddd21SDag-Erling Smørgrav 		if(c->http_in_headers || c->http_in_chunk_headers) {
353857bddd21SDag-Erling Smørgrav 			/* if header is done, process the header */
353957bddd21SDag-Erling Smørgrav 			if(!http_header_done(c->buffer)) {
354057bddd21SDag-Erling Smørgrav 				/* copy remaining data to front of buffer
354157bddd21SDag-Erling Smørgrav 				 * and set rest for writing into it */
354257bddd21SDag-Erling Smørgrav 				http_moveover_buffer(c->buffer);
354357bddd21SDag-Erling Smørgrav 				/* return and wait to read more */
354457bddd21SDag-Erling Smørgrav 				return 1;
354557bddd21SDag-Erling Smørgrav 			}
354657bddd21SDag-Erling Smørgrav 			if(!c->http_in_chunk_headers) {
354757bddd21SDag-Erling Smørgrav 				/* process initial headers */
354857bddd21SDag-Erling Smørgrav 				if(!http_process_initial_header(c))
354957bddd21SDag-Erling Smørgrav 					return 0;
355057bddd21SDag-Erling Smørgrav 			} else {
355157bddd21SDag-Erling Smørgrav 				/* process chunk headers */
355257bddd21SDag-Erling Smørgrav 				int r = http_process_chunk_header(c);
355357bddd21SDag-Erling Smørgrav 				if(r == 0) return 0;
355457bddd21SDag-Erling Smørgrav 				if(r == 2) return 1; /* done */
355557bddd21SDag-Erling Smørgrav 				/* r == 1, continue */
355657bddd21SDag-Erling Smørgrav 			}
355757bddd21SDag-Erling Smørgrav 			/* see if we have more to process */
355857bddd21SDag-Erling Smørgrav 			continue;
355957bddd21SDag-Erling Smørgrav 		}
356057bddd21SDag-Erling Smørgrav 
356157bddd21SDag-Erling Smørgrav 		if(!c->http_is_chunked) {
356257bddd21SDag-Erling Smørgrav 			/* if we are reading nonchunks, process that*/
356357bddd21SDag-Erling Smørgrav 			return http_nonchunk_segment(c);
356457bddd21SDag-Erling Smørgrav 		} else {
356557bddd21SDag-Erling Smørgrav 			/* if we are reading chunks, read the chunk */
356657bddd21SDag-Erling Smørgrav 			int r = http_chunked_segment(c);
356757bddd21SDag-Erling Smørgrav 			if(r == 0) return 0;
356857bddd21SDag-Erling Smørgrav 			if(r == 1) return 1;
356957bddd21SDag-Erling Smørgrav 			continue;
357057bddd21SDag-Erling Smørgrav 		}
357157bddd21SDag-Erling Smørgrav 	}
357257bddd21SDag-Erling Smørgrav 	/* broke out of the loop; could not process header instead need
357357bddd21SDag-Erling Smørgrav 	 * to read more */
357457bddd21SDag-Erling Smørgrav 	/* moveover any remaining data and read more data */
357557bddd21SDag-Erling Smørgrav 	http_moveover_buffer(c->buffer);
357657bddd21SDag-Erling Smørgrav 	/* return and wait to read more */
357757bddd21SDag-Erling Smørgrav 	return 1;
357857bddd21SDag-Erling Smørgrav }
357957bddd21SDag-Erling Smørgrav 
358057bddd21SDag-Erling Smørgrav /** check pending connect for http */
358157bddd21SDag-Erling Smørgrav static int
358257bddd21SDag-Erling Smørgrav http_check_connect(int fd, struct comm_point* c)
358357bddd21SDag-Erling Smørgrav {
358457bddd21SDag-Erling Smørgrav 	/* check for pending error from nonblocking connect */
358557bddd21SDag-Erling Smørgrav 	/* from Stevens, unix network programming, vol1, 3rd ed, p450*/
358657bddd21SDag-Erling Smørgrav 	int error = 0;
358757bddd21SDag-Erling Smørgrav 	socklen_t len = (socklen_t)sizeof(error);
358857bddd21SDag-Erling Smørgrav 	if(getsockopt(fd, SOL_SOCKET, SO_ERROR, (void*)&error,
358957bddd21SDag-Erling Smørgrav 		&len) < 0){
359057bddd21SDag-Erling Smørgrav #ifndef USE_WINSOCK
359157bddd21SDag-Erling Smørgrav 		error = errno; /* on solaris errno is error */
359257bddd21SDag-Erling Smørgrav #else /* USE_WINSOCK */
359357bddd21SDag-Erling Smørgrav 		error = WSAGetLastError();
359457bddd21SDag-Erling Smørgrav #endif
359557bddd21SDag-Erling Smørgrav 	}
359657bddd21SDag-Erling Smørgrav #ifndef USE_WINSOCK
359757bddd21SDag-Erling Smørgrav #if defined(EINPROGRESS) && defined(EWOULDBLOCK)
359857bddd21SDag-Erling Smørgrav 	if(error == EINPROGRESS || error == EWOULDBLOCK)
359957bddd21SDag-Erling Smørgrav 		return 1; /* try again later */
360057bddd21SDag-Erling Smørgrav 	else
360157bddd21SDag-Erling Smørgrav #endif
360257bddd21SDag-Erling Smørgrav 	if(error != 0 && verbosity < 2)
360357bddd21SDag-Erling Smørgrav 		return 0; /* silence lots of chatter in the logs */
360457bddd21SDag-Erling Smørgrav 	else if(error != 0) {
360557bddd21SDag-Erling Smørgrav 		log_err_addr("http connect", strerror(error),
3606865f46b2SCy Schubert 			&c->repinfo.remote_addr, c->repinfo.remote_addrlen);
360757bddd21SDag-Erling Smørgrav #else /* USE_WINSOCK */
360857bddd21SDag-Erling Smørgrav 	/* examine error */
360957bddd21SDag-Erling Smørgrav 	if(error == WSAEINPROGRESS)
361057bddd21SDag-Erling Smørgrav 		return 1;
361157bddd21SDag-Erling Smørgrav 	else if(error == WSAEWOULDBLOCK) {
361257bddd21SDag-Erling Smørgrav 		ub_winsock_tcp_wouldblock(c->ev->ev, UB_EV_WRITE);
361357bddd21SDag-Erling Smørgrav 		return 1;
361457bddd21SDag-Erling Smørgrav 	} else if(error != 0 && verbosity < 2)
361557bddd21SDag-Erling Smørgrav 		return 0;
361657bddd21SDag-Erling Smørgrav 	else if(error != 0) {
361757bddd21SDag-Erling Smørgrav 		log_err_addr("http connect", wsa_strerror(error),
3618865f46b2SCy Schubert 			&c->repinfo.remote_addr, c->repinfo.remote_addrlen);
361957bddd21SDag-Erling Smørgrav #endif /* USE_WINSOCK */
362057bddd21SDag-Erling Smørgrav 		return 0;
362157bddd21SDag-Erling Smørgrav 	}
362257bddd21SDag-Erling Smørgrav 	/* keep on processing this socket */
362357bddd21SDag-Erling Smørgrav 	return 2;
362457bddd21SDag-Erling Smørgrav }
362557bddd21SDag-Erling Smørgrav 
/**
 * Write more data for http (with ssl): one SSL_write attempt of the bytes
 * remaining in the comm point buffer. The buffer position advances by the
 * number of bytes that were written.
 * @param c: comm point with ssl object and buffer to write from.
 * @return 0 when the connection is closed or on error (also when SSL support
 *	is not compiled in), 1 when bytes were written or the write has to be
 *	retried later.
 */
static int
ssl_http_write_more(struct comm_point* c)
{
#ifdef HAVE_SSL
	int written, want;

	log_assert(sldns_buffer_remaining(c->buffer) > 0);
	ERR_clear_error();
	written = SSL_write(c->ssl, (void*)sldns_buffer_current(c->buffer),
		(int)sldns_buffer_remaining(c->buffer));
	if(written > 0) {
		sldns_buffer_skip(c->buffer, (ssize_t)written);
		return 1;
	}

	want = SSL_get_error(c->ssl, written);
	switch(want) {
	case SSL_ERROR_ZERO_RETURN:
		return 0; /* closed */
	case SSL_ERROR_WANT_READ:
		c->ssl_shake_state = comm_ssl_shake_hs_read;
		comm_point_listen_for_rw(c, 1, 0);
		return 1; /* wait for read condition */
	case SSL_ERROR_WANT_WRITE:
		return 1; /* write more later */
	case SSL_ERROR_SYSCALL:
#ifdef EPIPE
		if(errno == EPIPE && verbosity < 2)
			return 0; /* silence 'broken pipe' */
#endif
		if(errno != 0)
			log_err("SSL_write syscall: %s",
				strerror(errno));
		return 0;
	default:
		break;
	}
	log_crypto_err_io("could not SSL_write", want);
	return 0;
#else
	(void)c;
	return 0;
#endif /* HAVE_SSL */
}
366657bddd21SDag-Erling Smørgrav 
366757bddd21SDag-Erling Smørgrav /** write more data for http */
366857bddd21SDag-Erling Smørgrav static int
366957bddd21SDag-Erling Smørgrav http_write_more(int fd, struct comm_point* c)
367057bddd21SDag-Erling Smørgrav {
367157bddd21SDag-Erling Smørgrav 	ssize_t r;
367257bddd21SDag-Erling Smørgrav 	log_assert(sldns_buffer_remaining(c->buffer) > 0);
367357bddd21SDag-Erling Smørgrav 	r = send(fd, (void*)sldns_buffer_current(c->buffer),
367457bddd21SDag-Erling Smørgrav 		sldns_buffer_remaining(c->buffer), 0);
367557bddd21SDag-Erling Smørgrav 	if(r == -1) {
367657bddd21SDag-Erling Smørgrav #ifndef USE_WINSOCK
367757bddd21SDag-Erling Smørgrav 		if(errno == EINTR || errno == EAGAIN)
367857bddd21SDag-Erling Smørgrav 			return 1;
367957bddd21SDag-Erling Smørgrav #else
368057bddd21SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAEINPROGRESS)
368157bddd21SDag-Erling Smørgrav 			return 1;
368257bddd21SDag-Erling Smørgrav 		if(WSAGetLastError() == WSAEWOULDBLOCK) {
368357bddd21SDag-Erling Smørgrav 			ub_winsock_tcp_wouldblock(c->ev->ev, UB_EV_WRITE);
368457bddd21SDag-Erling Smørgrav 			return 1;
368557bddd21SDag-Erling Smørgrav 		}
368657bddd21SDag-Erling Smørgrav #endif
3687c0caa2e2SCy Schubert 		log_err_addr("http send r", sock_strerror(errno),
3688865f46b2SCy Schubert 			&c->repinfo.remote_addr, c->repinfo.remote_addrlen);
368957bddd21SDag-Erling Smørgrav 		return 0;
369057bddd21SDag-Erling Smørgrav 	}
369157bddd21SDag-Erling Smørgrav 	sldns_buffer_skip(c->buffer, r);
369257bddd21SDag-Erling Smørgrav 	return 1;
369357bddd21SDag-Erling Smørgrav }
369457bddd21SDag-Erling Smørgrav 
3695c0caa2e2SCy Schubert #ifdef HAVE_NGHTTP2
3696c0caa2e2SCy Schubert ssize_t http2_send_cb(nghttp2_session* ATTR_UNUSED(session), const uint8_t* buf,
3697c0caa2e2SCy Schubert 	size_t len, int ATTR_UNUSED(flags), void* cb_arg)
3698c0caa2e2SCy Schubert {
3699369c6923SCy Schubert 	ssize_t ret;
3700c0caa2e2SCy Schubert 	struct http2_session* h2_session = (struct http2_session*)cb_arg;
3701c0caa2e2SCy Schubert 	log_assert(h2_session->c->type == comm_http);
3702c0caa2e2SCy Schubert 	log_assert(h2_session->c->h2_session);
3703c0caa2e2SCy Schubert 
3704369c6923SCy Schubert #ifdef HAVE_SSL
3705369c6923SCy Schubert 	if(h2_session->c->ssl) {
3706369c6923SCy Schubert 		int r;
3707c0caa2e2SCy Schubert 		ERR_clear_error();
3708c0caa2e2SCy Schubert 		r = SSL_write(h2_session->c->ssl, buf, len);
3709c0caa2e2SCy Schubert 		if(r <= 0) {
3710c0caa2e2SCy Schubert 			int want = SSL_get_error(h2_session->c->ssl, r);
3711c0caa2e2SCy Schubert 			if(want == SSL_ERROR_ZERO_RETURN) {
3712c0caa2e2SCy Schubert 				return NGHTTP2_ERR_CALLBACK_FAILURE;
3713c0caa2e2SCy Schubert 			} else if(want == SSL_ERROR_WANT_READ) {
3714c0caa2e2SCy Schubert 				h2_session->c->ssl_shake_state = comm_ssl_shake_hs_read;
3715c0caa2e2SCy Schubert 				comm_point_listen_for_rw(h2_session->c, 1, 0);
3716c0caa2e2SCy Schubert 				return NGHTTP2_ERR_WOULDBLOCK;
3717c0caa2e2SCy Schubert 			} else if(want == SSL_ERROR_WANT_WRITE) {
3718c0caa2e2SCy Schubert 				return NGHTTP2_ERR_WOULDBLOCK;
3719c0caa2e2SCy Schubert 			} else if(want == SSL_ERROR_SYSCALL) {
3720c0caa2e2SCy Schubert #ifdef EPIPE
3721c0caa2e2SCy Schubert 				if(errno == EPIPE && verbosity < 2)
3722c0caa2e2SCy Schubert 					return NGHTTP2_ERR_CALLBACK_FAILURE;
3723c0caa2e2SCy Schubert #endif
3724c0caa2e2SCy Schubert 				if(errno != 0)
3725c0caa2e2SCy Schubert 					log_err("SSL_write syscall: %s",
3726c0caa2e2SCy Schubert 						strerror(errno));
3727c0caa2e2SCy Schubert 				return NGHTTP2_ERR_CALLBACK_FAILURE;
3728c0caa2e2SCy Schubert 			}
3729103ba509SCy Schubert 			log_crypto_err_io("could not SSL_write", want);
3730c0caa2e2SCy Schubert 			return NGHTTP2_ERR_CALLBACK_FAILURE;
3731c0caa2e2SCy Schubert 		}
3732c0caa2e2SCy Schubert 		return r;
3733369c6923SCy Schubert 	}
3734369c6923SCy Schubert #endif /* HAVE_SSL */
3735369c6923SCy Schubert 
3736369c6923SCy Schubert 	ret = send(h2_session->c->fd, buf, len, 0);
3737369c6923SCy Schubert 	if(ret == 0) {
3738369c6923SCy Schubert 		return NGHTTP2_ERR_CALLBACK_FAILURE;
3739369c6923SCy Schubert 	} else if(ret < 0) {
3740369c6923SCy Schubert #ifndef USE_WINSOCK
3741369c6923SCy Schubert 		if(errno == EINTR || errno == EAGAIN)
3742369c6923SCy Schubert 			return NGHTTP2_ERR_WOULDBLOCK;
3743369c6923SCy Schubert #ifdef EPIPE
3744369c6923SCy Schubert 		if(errno == EPIPE && verbosity < 2)
3745369c6923SCy Schubert 			return NGHTTP2_ERR_CALLBACK_FAILURE;
3746c0caa2e2SCy Schubert #endif
3747369c6923SCy Schubert #ifdef ECONNRESET
3748369c6923SCy Schubert 		if(errno == ECONNRESET && verbosity < 2)
3749369c6923SCy Schubert 			return NGHTTP2_ERR_CALLBACK_FAILURE;
3750369c6923SCy Schubert #endif
3751369c6923SCy Schubert 		log_err_addr("could not http2 write: %s", strerror(errno),
3752865f46b2SCy Schubert 			&h2_session->c->repinfo.remote_addr,
3753865f46b2SCy Schubert 			h2_session->c->repinfo.remote_addrlen);
3754369c6923SCy Schubert #else /* USE_WINSOCK */
3755369c6923SCy Schubert 		if(WSAGetLastError() == WSAENOTCONN)
3756369c6923SCy Schubert 			return NGHTTP2_ERR_WOULDBLOCK;
3757369c6923SCy Schubert 		if(WSAGetLastError() == WSAEINPROGRESS)
3758369c6923SCy Schubert 			return NGHTTP2_ERR_WOULDBLOCK;
3759369c6923SCy Schubert 		if(WSAGetLastError() == WSAEWOULDBLOCK) {
3760369c6923SCy Schubert 			ub_winsock_tcp_wouldblock(h2_session->c->ev->ev,
3761369c6923SCy Schubert 				UB_EV_WRITE);
3762369c6923SCy Schubert 			return NGHTTP2_ERR_WOULDBLOCK;
3763369c6923SCy Schubert 		}
3764369c6923SCy Schubert 		if(WSAGetLastError() == WSAECONNRESET && verbosity < 2)
3765369c6923SCy Schubert 			return NGHTTP2_ERR_CALLBACK_FAILURE;
3766369c6923SCy Schubert 		log_err_addr("could not http2 write: %s",
3767369c6923SCy Schubert 			wsa_strerror(WSAGetLastError()),
3768865f46b2SCy Schubert 			&h2_session->c->repinfo.remote_addr,
3769865f46b2SCy Schubert 			h2_session->c->repinfo.remote_addrlen);
3770369c6923SCy Schubert #endif
3771369c6923SCy Schubert 		return NGHTTP2_ERR_CALLBACK_FAILURE;
3772369c6923SCy Schubert 	}
3773369c6923SCy Schubert 	return ret;
3774c0caa2e2SCy Schubert }
3775c0caa2e2SCy Schubert #endif /* HAVE_NGHTTP2 */
3776c0caa2e2SCy Schubert 
/**
 * Handle http2 writing.
 * Lets nghttp2 send its pending output, then decides what the comm point
 * should wait for next.
 * @param c: comm point with an http2 session.
 * @return 0 when nghttp2 reported an error, when the session wants neither
 *	to read nor to write (connection can be closed), or when nghttp2
 *	support is not compiled in; 1 otherwise.
 */
static int
comm_point_http2_handle_write(int ATTR_UNUSED(fd), struct comm_point* c)
{
#ifdef HAVE_NGHTTP2
	int rv;
	log_assert(c->h2_session);

	rv = nghttp2_session_send(c->h2_session->session);
	if(rv != 0) {
		verbose(VERB_QUERY, "http2: session_send failed, "
			"error: %s", nghttp2_strerror(rv));
		return 0;
	}

	if(!nghttp2_session_want_read(c->h2_session->session)) {
		if(!nghttp2_session_want_write(c->h2_session->session))
			return 0; /* connection can be closed */
		return 1;
	}

	/* nghttp2 expects input: switch the comm point back to reading */
	c->tcp_is_reading = 1;
	comm_point_stop_listening(c);
	comm_point_start_listening(c, -1, adjusted_tcp_timeout(c));
	return 1;
#else
	(void)c;
	return 0;
#endif
}
3804c0caa2e2SCy Schubert 
380557bddd21SDag-Erling Smørgrav /**
380657bddd21SDag-Erling Smørgrav  * Handle http writing callback.
380757bddd21SDag-Erling Smørgrav  * @param fd: file descriptor of socket.
380857bddd21SDag-Erling Smørgrav  * @param c: comm point to write buffer out of.
380957bddd21SDag-Erling Smørgrav  * @return: 0 on error
381057bddd21SDag-Erling Smørgrav  */
381157bddd21SDag-Erling Smørgrav static int
381257bddd21SDag-Erling Smørgrav comm_point_http_handle_write(int fd, struct comm_point* c)
381357bddd21SDag-Erling Smørgrav {
381457bddd21SDag-Erling Smørgrav 	log_assert(c->type == comm_http);
381557bddd21SDag-Erling Smørgrav 	log_assert(fd != -1);
381657bddd21SDag-Erling Smørgrav 
381757bddd21SDag-Erling Smørgrav 	/* check pending connect errors, if that fails, we wait for more,
381857bddd21SDag-Erling Smørgrav 	 * or we can continue to write contents */
381957bddd21SDag-Erling Smørgrav 	if(c->tcp_check_nb_connect) {
382057bddd21SDag-Erling Smørgrav 		int r = http_check_connect(fd, c);
382157bddd21SDag-Erling Smørgrav 		if(r == 0) return 0;
382257bddd21SDag-Erling Smørgrav 		if(r == 1) return 1;
382357bddd21SDag-Erling Smørgrav 		c->tcp_check_nb_connect = 0;
382457bddd21SDag-Erling Smørgrav 	}
382557bddd21SDag-Erling Smørgrav 	/* if we are in ssl handshake, handle SSL handshake */
382657bddd21SDag-Erling Smørgrav #ifdef HAVE_SSL
382757bddd21SDag-Erling Smørgrav 	if(c->ssl && c->ssl_shake_state != comm_ssl_shake_none) {
382857bddd21SDag-Erling Smørgrav 		if(!ssl_handshake(c))
382957bddd21SDag-Erling Smørgrav 			return 0;
383057bddd21SDag-Erling Smørgrav 		if(c->ssl_shake_state != comm_ssl_shake_none)
383157bddd21SDag-Erling Smørgrav 			return 1;
383257bddd21SDag-Erling Smørgrav 	}
383357bddd21SDag-Erling Smørgrav #endif /* HAVE_SSL */
383457bddd21SDag-Erling Smørgrav 	if(c->tcp_is_reading)
383557bddd21SDag-Erling Smørgrav 		return 1;
3836c0caa2e2SCy Schubert 
3837c0caa2e2SCy Schubert 	if(c->use_h2) {
3838c0caa2e2SCy Schubert 		return comm_point_http2_handle_write(fd, c);
3839c0caa2e2SCy Schubert 	}
3840c0caa2e2SCy Schubert 
3841c0caa2e2SCy Schubert 	/* http version is <= http/1.1 */
3842c0caa2e2SCy Schubert 
3843c0caa2e2SCy Schubert 	if(c->http_min_version >= http_version_2) {
3844c0caa2e2SCy Schubert 		/* HTTP/2 failed, not allowed to use lower version. */
3845c0caa2e2SCy Schubert 		return 0;
3846c0caa2e2SCy Schubert 	}
3847c0caa2e2SCy Schubert 
384857bddd21SDag-Erling Smørgrav 	/* if we are writing, write more */
384957bddd21SDag-Erling Smørgrav 	if(c->ssl) {
385057bddd21SDag-Erling Smørgrav 		if(!ssl_http_write_more(c))
385157bddd21SDag-Erling Smørgrav 			return 0;
385257bddd21SDag-Erling Smørgrav 	} else {
385357bddd21SDag-Erling Smørgrav 		if(!http_write_more(fd, c))
385457bddd21SDag-Erling Smørgrav 			return 0;
385557bddd21SDag-Erling Smørgrav 	}
385657bddd21SDag-Erling Smørgrav 
385757bddd21SDag-Erling Smørgrav 	/* we write a single buffer contents, that can contain
385857bddd21SDag-Erling Smørgrav 	 * the http request, and then flip to read the results */
385957bddd21SDag-Erling Smørgrav 	/* see if write is done */
386057bddd21SDag-Erling Smørgrav 	if(sldns_buffer_remaining(c->buffer) == 0) {
386157bddd21SDag-Erling Smørgrav 		sldns_buffer_clear(c->buffer);
386257bddd21SDag-Erling Smørgrav 		if(c->tcp_do_toggle_rw)
386357bddd21SDag-Erling Smørgrav 			c->tcp_is_reading = 1;
386457bddd21SDag-Erling Smørgrav 		c->tcp_byte_count = 0;
386557bddd21SDag-Erling Smørgrav 		/* switch from listening(write) to listening(read) */
386657bddd21SDag-Erling Smørgrav 		comm_point_stop_listening(c);
386757bddd21SDag-Erling Smørgrav 		comm_point_start_listening(c, -1, -1);
386857bddd21SDag-Erling Smørgrav 	}
386957bddd21SDag-Erling Smørgrav 	return 1;
387057bddd21SDag-Erling Smørgrav }
387157bddd21SDag-Erling Smørgrav 
387257bddd21SDag-Erling Smørgrav void
387357bddd21SDag-Erling Smørgrav comm_point_http_handle_callback(int fd, short event, void* arg)
387457bddd21SDag-Erling Smørgrav {
387557bddd21SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)arg;
387657bddd21SDag-Erling Smørgrav 	log_assert(c->type == comm_http);
387757bddd21SDag-Erling Smørgrav 	ub_comm_base_now(c->ev->base);
387857bddd21SDag-Erling Smørgrav 
3879e86b9096SDag-Erling Smørgrav 	if(event&UB_EV_TIMEOUT) {
3880e86b9096SDag-Erling Smørgrav 		verbose(VERB_QUERY, "http took too long, dropped");
3881e86b9096SDag-Erling Smørgrav 		reclaim_http_handler(c);
3882e86b9096SDag-Erling Smørgrav 		if(!c->tcp_do_close) {
3883e86b9096SDag-Erling Smørgrav 			fptr_ok(fptr_whitelist_comm_point(c->callback));
3884e86b9096SDag-Erling Smørgrav 			(void)(*c->callback)(c, c->cb_arg,
3885e86b9096SDag-Erling Smørgrav 				NETEVENT_TIMEOUT, NULL);
3886e86b9096SDag-Erling Smørgrav 		}
3887e86b9096SDag-Erling Smørgrav 		return;
3888e86b9096SDag-Erling Smørgrav 	}
388957bddd21SDag-Erling Smørgrav 	if(event&UB_EV_READ) {
389057bddd21SDag-Erling Smørgrav 		if(!comm_point_http_handle_read(fd, c)) {
389157bddd21SDag-Erling Smørgrav 			reclaim_http_handler(c);
389257bddd21SDag-Erling Smørgrav 			if(!c->tcp_do_close) {
389357bddd21SDag-Erling Smørgrav 				fptr_ok(fptr_whitelist_comm_point(
389457bddd21SDag-Erling Smørgrav 					c->callback));
389557bddd21SDag-Erling Smørgrav 				(void)(*c->callback)(c, c->cb_arg,
389657bddd21SDag-Erling Smørgrav 					NETEVENT_CLOSED, NULL);
389757bddd21SDag-Erling Smørgrav 			}
389857bddd21SDag-Erling Smørgrav 		}
389957bddd21SDag-Erling Smørgrav 		return;
390057bddd21SDag-Erling Smørgrav 	}
390157bddd21SDag-Erling Smørgrav 	if(event&UB_EV_WRITE) {
390257bddd21SDag-Erling Smørgrav 		if(!comm_point_http_handle_write(fd, c)) {
390357bddd21SDag-Erling Smørgrav 			reclaim_http_handler(c);
390457bddd21SDag-Erling Smørgrav 			if(!c->tcp_do_close) {
390557bddd21SDag-Erling Smørgrav 				fptr_ok(fptr_whitelist_comm_point(
390657bddd21SDag-Erling Smørgrav 					c->callback));
390757bddd21SDag-Erling Smørgrav 				(void)(*c->callback)(c, c->cb_arg,
390857bddd21SDag-Erling Smørgrav 					NETEVENT_CLOSED, NULL);
390957bddd21SDag-Erling Smørgrav 			}
391057bddd21SDag-Erling Smørgrav 		}
391157bddd21SDag-Erling Smørgrav 		return;
391257bddd21SDag-Erling Smørgrav 	}
391357bddd21SDag-Erling Smørgrav 	log_err("Ignored event %d for httphdl.", event);
391457bddd21SDag-Erling Smørgrav }
391557bddd21SDag-Erling Smørgrav 
3916b7579f77SDag-Erling Smørgrav void comm_point_local_handle_callback(int fd, short event, void* arg)
3917b7579f77SDag-Erling Smørgrav {
3918b7579f77SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)arg;
3919b7579f77SDag-Erling Smørgrav 	log_assert(c->type == comm_local);
3920e2d15004SDag-Erling Smørgrav 	ub_comm_base_now(c->ev->base);
3921b7579f77SDag-Erling Smørgrav 
3922e2d15004SDag-Erling Smørgrav 	if(event&UB_EV_READ) {
3923b7579f77SDag-Erling Smørgrav 		if(!comm_point_tcp_handle_read(fd, c, 1)) {
3924b7579f77SDag-Erling Smørgrav 			fptr_ok(fptr_whitelist_comm_point(c->callback));
3925b7579f77SDag-Erling Smørgrav 			(void)(*c->callback)(c, c->cb_arg, NETEVENT_CLOSED,
3926b7579f77SDag-Erling Smørgrav 				NULL);
3927b7579f77SDag-Erling Smørgrav 		}
3928b7579f77SDag-Erling Smørgrav 		return;
3929b7579f77SDag-Erling Smørgrav 	}
3930b7579f77SDag-Erling Smørgrav 	log_err("Ignored event %d for localhdl.", event);
3931b7579f77SDag-Erling Smørgrav }
3932b7579f77SDag-Erling Smørgrav 
3933b7579f77SDag-Erling Smørgrav void comm_point_raw_handle_callback(int ATTR_UNUSED(fd),
3934b7579f77SDag-Erling Smørgrav 	short event, void* arg)
3935b7579f77SDag-Erling Smørgrav {
3936b7579f77SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)arg;
3937b7579f77SDag-Erling Smørgrav 	int err = NETEVENT_NOERROR;
3938b7579f77SDag-Erling Smørgrav 	log_assert(c->type == comm_raw);
3939e2d15004SDag-Erling Smørgrav 	ub_comm_base_now(c->ev->base);
3940b7579f77SDag-Erling Smørgrav 
3941e2d15004SDag-Erling Smørgrav 	if(event&UB_EV_TIMEOUT)
3942b7579f77SDag-Erling Smørgrav 		err = NETEVENT_TIMEOUT;
3943b7579f77SDag-Erling Smørgrav 	fptr_ok(fptr_whitelist_comm_point_raw(c->callback));
3944b7579f77SDag-Erling Smørgrav 	(void)(*c->callback)(c, c->cb_arg, err, NULL);
3945b7579f77SDag-Erling Smørgrav }
3946b7579f77SDag-Erling Smørgrav 
3947b7579f77SDag-Erling Smørgrav struct comm_point*
394817d15b25SDag-Erling Smørgrav comm_point_create_udp(struct comm_base *base, int fd, sldns_buffer* buffer,
3949865f46b2SCy Schubert 	int pp2_enabled, comm_point_callback_type* callback,
3950865f46b2SCy Schubert 	void* callback_arg, struct unbound_socket* socket)
3951b7579f77SDag-Erling Smørgrav {
3952b7579f77SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)calloc(1,
3953b7579f77SDag-Erling Smørgrav 		sizeof(struct comm_point));
3954b7579f77SDag-Erling Smørgrav 	short evbits;
3955b7579f77SDag-Erling Smørgrav 	if(!c)
3956b7579f77SDag-Erling Smørgrav 		return NULL;
3957b7579f77SDag-Erling Smørgrav 	c->ev = (struct internal_event*)calloc(1,
3958b7579f77SDag-Erling Smørgrav 		sizeof(struct internal_event));
3959b7579f77SDag-Erling Smørgrav 	if(!c->ev) {
3960b7579f77SDag-Erling Smørgrav 		free(c);
3961b7579f77SDag-Erling Smørgrav 		return NULL;
3962b7579f77SDag-Erling Smørgrav 	}
3963b7579f77SDag-Erling Smørgrav 	c->ev->base = base;
3964b7579f77SDag-Erling Smørgrav 	c->fd = fd;
3965b7579f77SDag-Erling Smørgrav 	c->buffer = buffer;
3966b7579f77SDag-Erling Smørgrav 	c->timeout = NULL;
3967b7579f77SDag-Erling Smørgrav 	c->tcp_is_reading = 0;
3968b7579f77SDag-Erling Smørgrav 	c->tcp_byte_count = 0;
3969b7579f77SDag-Erling Smørgrav 	c->tcp_parent = NULL;
3970b7579f77SDag-Erling Smørgrav 	c->max_tcp_count = 0;
397109a3aaf3SDag-Erling Smørgrav 	c->cur_tcp_count = 0;
3972b7579f77SDag-Erling Smørgrav 	c->tcp_handlers = NULL;
3973b7579f77SDag-Erling Smørgrav 	c->tcp_free = NULL;
3974b7579f77SDag-Erling Smørgrav 	c->type = comm_udp;
3975b7579f77SDag-Erling Smørgrav 	c->tcp_do_close = 0;
3976b7579f77SDag-Erling Smørgrav 	c->do_not_close = 0;
3977b7579f77SDag-Erling Smørgrav 	c->tcp_do_toggle_rw = 0;
3978b7579f77SDag-Erling Smørgrav 	c->tcp_check_nb_connect = 0;
3979b5663de9SDag-Erling Smørgrav #ifdef USE_MSG_FASTOPEN
3980b5663de9SDag-Erling Smørgrav 	c->tcp_do_fastopen = 0;
3981b5663de9SDag-Erling Smørgrav #endif
398265b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
398365b390aaSDag-Erling Smørgrav 	c->dnscrypt = 0;
398465b390aaSDag-Erling Smørgrav 	c->dnscrypt_buffer = buffer;
398565b390aaSDag-Erling Smørgrav #endif
3986b7579f77SDag-Erling Smørgrav 	c->inuse = 0;
3987b7579f77SDag-Erling Smørgrav 	c->callback = callback;
3988b7579f77SDag-Erling Smørgrav 	c->cb_arg = callback_arg;
39895469a995SCy Schubert 	c->socket = socket;
3990865f46b2SCy Schubert 	c->pp2_enabled = pp2_enabled;
3991865f46b2SCy Schubert 	c->pp2_header_state = pp2_header_none;
3992e2d15004SDag-Erling Smørgrav 	evbits = UB_EV_READ | UB_EV_PERSIST;
3993e2d15004SDag-Erling Smørgrav 	/* ub_event stuff */
3994e2d15004SDag-Erling Smørgrav 	c->ev->ev = ub_event_new(base->eb->base, c->fd, evbits,
3995e2d15004SDag-Erling Smørgrav 		comm_point_udp_callback, c);
3996e2d15004SDag-Erling Smørgrav 	if(c->ev->ev == NULL) {
3997b7579f77SDag-Erling Smørgrav 		log_err("could not baseset udp event");
3998b7579f77SDag-Erling Smørgrav 		comm_point_delete(c);
3999b7579f77SDag-Erling Smørgrav 		return NULL;
4000b7579f77SDag-Erling Smørgrav 	}
4001e2d15004SDag-Erling Smørgrav 	if(fd!=-1 && ub_event_add(c->ev->ev, c->timeout) != 0 ) {
4002b7579f77SDag-Erling Smørgrav 		log_err("could not add udp event");
4003b7579f77SDag-Erling Smørgrav 		comm_point_delete(c);
4004b7579f77SDag-Erling Smørgrav 		return NULL;
4005b7579f77SDag-Erling Smørgrav 	}
4006f44e67d1SCy Schubert 	c->event_added = 1;
4007b7579f77SDag-Erling Smørgrav 	return c;
4008b7579f77SDag-Erling Smørgrav }
4009b7579f77SDag-Erling Smørgrav 
#if defined(AF_INET6) && defined(IPV6_PKTINFO) && defined(HAVE_RECVMSG)
/**
 * Create a UDP comm point whose read event is handled by
 * comm_point_udp_ancil_callback.
 * Only compiled when AF_INET6, IPV6_PKTINFO and HAVE_RECVMSG are
 * available. The comm point uses the buffer passed in by the caller and
 * has no timeout.
 * @param base: comm base; the event is created on its event base.
 * @param fd: socket to read from, or -1 to create the comm point without
 *	adding its event.
 * @param buffer: buffer stored in the comm point.
 * @param pp2_enabled: stored in the comm point as pp2_enabled.
 * @param callback: stored as the comm point callback.
 * @param callback_arg: stored as the callback argument.
 * @param socket: stored in the comm point.
 * @return the comm point, or NULL on allocation or event failure.
 */
struct comm_point*
comm_point_create_udp_ancil(struct comm_base *base, int fd,
	sldns_buffer* buffer, int pp2_enabled,
	comm_point_callback_type* callback, void* callback_arg, struct unbound_socket* socket)
{
	struct comm_point* c = (struct comm_point*)calloc(1,
		sizeof(struct comm_point));
	short evbits;
	if(!c)
		return NULL;
	c->ev = (struct internal_event*)calloc(1,
		sizeof(struct internal_event));
	if(!c->ev) {
		free(c);
		return NULL;
	}
	c->ev->base = base;
	c->fd = fd;
	c->buffer = buffer;
	c->timeout = NULL;
	c->tcp_is_reading = 0;
	c->tcp_byte_count = 0;
	c->tcp_parent = NULL;
	c->max_tcp_count = 0;
	c->cur_tcp_count = 0;
	c->tcp_handlers = NULL;
	c->tcp_free = NULL;
	c->type = comm_udp;
	c->tcp_do_close = 0;
	c->do_not_close = 0;
#ifdef USE_DNSCRYPT
	c->dnscrypt = 0;
	c->dnscrypt_buffer = buffer;
#endif
	c->inuse = 0;
	c->tcp_do_toggle_rw = 0;
	c->tcp_check_nb_connect = 0;
#ifdef USE_MSG_FASTOPEN
	c->tcp_do_fastopen = 0;
#endif
	c->callback = callback;
	c->cb_arg = callback_arg;
	c->socket = socket;
	c->pp2_enabled = pp2_enabled;
	c->pp2_header_state = pp2_header_none;
	evbits = UB_EV_READ | UB_EV_PERSIST;
	/* ub_event stuff */
	c->ev->ev = ub_event_new(base->eb->base, c->fd, evbits,
		comm_point_udp_ancil_callback, c);
	if(c->ev->ev == NULL) {
		log_err("could not baseset udp event");
		comm_point_delete(c);
		return NULL;
	}
	/* without a socket the event is not added, and event_added stays 0
	 * (from calloc) so the flag matches what was actually registered */
	if(fd != -1) {
		if(ub_event_add(c->ev->ev, c->timeout) != 0) {
			log_err("could not add udp event");
			comm_point_delete(c);
			return NULL;
		}
		c->event_added = 1;
	}
	return c;
}
#endif
4074b7579f77SDag-Erling Smørgrav 
4075b7579f77SDag-Erling Smørgrav static struct comm_point*
4076b7579f77SDag-Erling Smørgrav comm_point_create_tcp_handler(struct comm_base *base,
4077b7579f77SDag-Erling Smørgrav 	struct comm_point* parent, size_t bufsize,
4078e86b9096SDag-Erling Smørgrav 	struct sldns_buffer* spoolbuf, comm_point_callback_type* callback,
40795469a995SCy Schubert 	void* callback_arg, struct unbound_socket* socket)
4080b7579f77SDag-Erling Smørgrav {
4081b7579f77SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)calloc(1,
4082b7579f77SDag-Erling Smørgrav 		sizeof(struct comm_point));
4083b7579f77SDag-Erling Smørgrav 	short evbits;
4084b7579f77SDag-Erling Smørgrav 	if(!c)
4085b7579f77SDag-Erling Smørgrav 		return NULL;
4086b7579f77SDag-Erling Smørgrav 	c->ev = (struct internal_event*)calloc(1,
4087b7579f77SDag-Erling Smørgrav 		sizeof(struct internal_event));
4088b7579f77SDag-Erling Smørgrav 	if(!c->ev) {
4089b7579f77SDag-Erling Smørgrav 		free(c);
4090b7579f77SDag-Erling Smørgrav 		return NULL;
4091b7579f77SDag-Erling Smørgrav 	}
4092b7579f77SDag-Erling Smørgrav 	c->ev->base = base;
4093b7579f77SDag-Erling Smørgrav 	c->fd = -1;
409417d15b25SDag-Erling Smørgrav 	c->buffer = sldns_buffer_new(bufsize);
4095b7579f77SDag-Erling Smørgrav 	if(!c->buffer) {
4096b7579f77SDag-Erling Smørgrav 		free(c->ev);
4097b7579f77SDag-Erling Smørgrav 		free(c);
4098b7579f77SDag-Erling Smørgrav 		return NULL;
4099b7579f77SDag-Erling Smørgrav 	}
4100b7579f77SDag-Erling Smørgrav 	c->timeout = (struct timeval*)malloc(sizeof(struct timeval));
4101b7579f77SDag-Erling Smørgrav 	if(!c->timeout) {
410217d15b25SDag-Erling Smørgrav 		sldns_buffer_free(c->buffer);
4103b7579f77SDag-Erling Smørgrav 		free(c->ev);
4104b7579f77SDag-Erling Smørgrav 		free(c);
4105b7579f77SDag-Erling Smørgrav 		return NULL;
4106b7579f77SDag-Erling Smørgrav 	}
4107b7579f77SDag-Erling Smørgrav 	c->tcp_is_reading = 0;
4108b7579f77SDag-Erling Smørgrav 	c->tcp_byte_count = 0;
4109b7579f77SDag-Erling Smørgrav 	c->tcp_parent = parent;
41104c75e3aaSDag-Erling Smørgrav 	c->tcp_timeout_msec = parent->tcp_timeout_msec;
41114c75e3aaSDag-Erling Smørgrav 	c->tcp_conn_limit = parent->tcp_conn_limit;
41124c75e3aaSDag-Erling Smørgrav 	c->tcl_addr = NULL;
41134c75e3aaSDag-Erling Smørgrav 	c->tcp_keepalive = 0;
4114b7579f77SDag-Erling Smørgrav 	c->max_tcp_count = 0;
411509a3aaf3SDag-Erling Smørgrav 	c->cur_tcp_count = 0;
4116b7579f77SDag-Erling Smørgrav 	c->tcp_handlers = NULL;
4117b7579f77SDag-Erling Smørgrav 	c->tcp_free = NULL;
4118b7579f77SDag-Erling Smørgrav 	c->type = comm_tcp;
4119b7579f77SDag-Erling Smørgrav 	c->tcp_do_close = 0;
4120b7579f77SDag-Erling Smørgrav 	c->do_not_close = 0;
4121b7579f77SDag-Erling Smørgrav 	c->tcp_do_toggle_rw = 1;
4122b7579f77SDag-Erling Smørgrav 	c->tcp_check_nb_connect = 0;
4123b5663de9SDag-Erling Smørgrav #ifdef USE_MSG_FASTOPEN
4124b5663de9SDag-Erling Smørgrav 	c->tcp_do_fastopen = 0;
4125b5663de9SDag-Erling Smørgrav #endif
412665b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
412765b390aaSDag-Erling Smørgrav 	c->dnscrypt = 0;
4128c7f4d7adSDag-Erling Smørgrav 	/* We don't know just yet if this is a dnscrypt channel. Allocation
4129c7f4d7adSDag-Erling Smørgrav 	 * will be done when handling the callback. */
413065b390aaSDag-Erling Smørgrav 	c->dnscrypt_buffer = c->buffer;
413165b390aaSDag-Erling Smørgrav #endif
4132b7579f77SDag-Erling Smørgrav 	c->repinfo.c = c;
4133b7579f77SDag-Erling Smørgrav 	c->callback = callback;
4134b7579f77SDag-Erling Smørgrav 	c->cb_arg = callback_arg;
41355469a995SCy Schubert 	c->socket = socket;
4136865f46b2SCy Schubert 	c->pp2_enabled = parent->pp2_enabled;
4137865f46b2SCy Schubert 	c->pp2_header_state = pp2_header_none;
4138e86b9096SDag-Erling Smørgrav 	if(spoolbuf) {
4139e86b9096SDag-Erling Smørgrav 		c->tcp_req_info = tcp_req_info_create(spoolbuf);
4140e86b9096SDag-Erling Smørgrav 		if(!c->tcp_req_info) {
4141e86b9096SDag-Erling Smørgrav 			log_err("could not create tcp commpoint");
4142e86b9096SDag-Erling Smørgrav 			sldns_buffer_free(c->buffer);
4143e86b9096SDag-Erling Smørgrav 			free(c->timeout);
4144e86b9096SDag-Erling Smørgrav 			free(c->ev);
4145e86b9096SDag-Erling Smørgrav 			free(c);
4146e86b9096SDag-Erling Smørgrav 			return NULL;
4147e86b9096SDag-Erling Smørgrav 		}
4148e86b9096SDag-Erling Smørgrav 		c->tcp_req_info->cp = c;
4149e86b9096SDag-Erling Smørgrav 		c->tcp_do_close = 1;
4150e86b9096SDag-Erling Smørgrav 		c->tcp_do_toggle_rw = 0;
4151e86b9096SDag-Erling Smørgrav 	}
4152b7579f77SDag-Erling Smørgrav 	/* add to parent free list */
4153b7579f77SDag-Erling Smørgrav 	c->tcp_free = parent->tcp_free;
4154b7579f77SDag-Erling Smørgrav 	parent->tcp_free = c;
4155e2d15004SDag-Erling Smørgrav 	/* ub_event stuff */
4156e2d15004SDag-Erling Smørgrav 	evbits = UB_EV_PERSIST | UB_EV_READ | UB_EV_TIMEOUT;
4157e2d15004SDag-Erling Smørgrav 	c->ev->ev = ub_event_new(base->eb->base, c->fd, evbits,
4158e2d15004SDag-Erling Smørgrav 		comm_point_tcp_handle_callback, c);
4159e2d15004SDag-Erling Smørgrav 	if(c->ev->ev == NULL)
4160b7579f77SDag-Erling Smørgrav 	{
4161b7579f77SDag-Erling Smørgrav 		log_err("could not basetset tcphdl event");
4162b7579f77SDag-Erling Smørgrav 		parent->tcp_free = c->tcp_free;
4163e86b9096SDag-Erling Smørgrav 		tcp_req_info_delete(c->tcp_req_info);
4164e86b9096SDag-Erling Smørgrav 		sldns_buffer_free(c->buffer);
4165e86b9096SDag-Erling Smørgrav 		free(c->timeout);
4166b7579f77SDag-Erling Smørgrav 		free(c->ev);
4167b7579f77SDag-Erling Smørgrav 		free(c);
4168b7579f77SDag-Erling Smørgrav 		return NULL;
4169b7579f77SDag-Erling Smørgrav 	}
4170b7579f77SDag-Erling Smørgrav 	return c;
4171b7579f77SDag-Erling Smørgrav }
4172b7579f77SDag-Erling Smørgrav 
4173c0caa2e2SCy Schubert static struct comm_point*
4174c0caa2e2SCy Schubert comm_point_create_http_handler(struct comm_base *base,
4175c0caa2e2SCy Schubert 	struct comm_point* parent, size_t bufsize, int harden_large_queries,
4176c0caa2e2SCy Schubert 	uint32_t http_max_streams, char* http_endpoint,
41775469a995SCy Schubert 	comm_point_callback_type* callback, void* callback_arg,
41785469a995SCy Schubert 	struct unbound_socket* socket)
4179c0caa2e2SCy Schubert {
4180c0caa2e2SCy Schubert 	struct comm_point* c = (struct comm_point*)calloc(1,
4181c0caa2e2SCy Schubert 		sizeof(struct comm_point));
4182c0caa2e2SCy Schubert 	short evbits;
4183c0caa2e2SCy Schubert 	if(!c)
4184c0caa2e2SCy Schubert 		return NULL;
4185c0caa2e2SCy Schubert 	c->ev = (struct internal_event*)calloc(1,
4186c0caa2e2SCy Schubert 		sizeof(struct internal_event));
4187c0caa2e2SCy Schubert 	if(!c->ev) {
4188c0caa2e2SCy Schubert 		free(c);
4189c0caa2e2SCy Schubert 		return NULL;
4190c0caa2e2SCy Schubert 	}
4191c0caa2e2SCy Schubert 	c->ev->base = base;
4192c0caa2e2SCy Schubert 	c->fd = -1;
4193c0caa2e2SCy Schubert 	c->buffer = sldns_buffer_new(bufsize);
4194c0caa2e2SCy Schubert 	if(!c->buffer) {
4195c0caa2e2SCy Schubert 		free(c->ev);
4196c0caa2e2SCy Schubert 		free(c);
4197c0caa2e2SCy Schubert 		return NULL;
4198c0caa2e2SCy Schubert 	}
4199c0caa2e2SCy Schubert 	c->timeout = (struct timeval*)malloc(sizeof(struct timeval));
4200c0caa2e2SCy Schubert 	if(!c->timeout) {
4201c0caa2e2SCy Schubert 		sldns_buffer_free(c->buffer);
4202c0caa2e2SCy Schubert 		free(c->ev);
4203c0caa2e2SCy Schubert 		free(c);
4204c0caa2e2SCy Schubert 		return NULL;
4205c0caa2e2SCy Schubert 	}
4206c0caa2e2SCy Schubert 	c->tcp_is_reading = 0;
4207c0caa2e2SCy Schubert 	c->tcp_byte_count = 0;
4208c0caa2e2SCy Schubert 	c->tcp_parent = parent;
4209c0caa2e2SCy Schubert 	c->tcp_timeout_msec = parent->tcp_timeout_msec;
4210c0caa2e2SCy Schubert 	c->tcp_conn_limit = parent->tcp_conn_limit;
4211c0caa2e2SCy Schubert 	c->tcl_addr = NULL;
4212c0caa2e2SCy Schubert 	c->tcp_keepalive = 0;
4213c0caa2e2SCy Schubert 	c->max_tcp_count = 0;
4214c0caa2e2SCy Schubert 	c->cur_tcp_count = 0;
4215c0caa2e2SCy Schubert 	c->tcp_handlers = NULL;
4216c0caa2e2SCy Schubert 	c->tcp_free = NULL;
4217c0caa2e2SCy Schubert 	c->type = comm_http;
4218c0caa2e2SCy Schubert 	c->tcp_do_close = 1;
4219c0caa2e2SCy Schubert 	c->do_not_close = 0;
4220c0caa2e2SCy Schubert 	c->tcp_do_toggle_rw = 1; /* will be set to 0 after http2 upgrade */
4221c0caa2e2SCy Schubert 	c->tcp_check_nb_connect = 0;
4222c0caa2e2SCy Schubert #ifdef USE_MSG_FASTOPEN
4223c0caa2e2SCy Schubert 	c->tcp_do_fastopen = 0;
4224c0caa2e2SCy Schubert #endif
4225c0caa2e2SCy Schubert #ifdef USE_DNSCRYPT
4226c0caa2e2SCy Schubert 	c->dnscrypt = 0;
4227c0caa2e2SCy Schubert 	c->dnscrypt_buffer = NULL;
4228c0caa2e2SCy Schubert #endif
4229c0caa2e2SCy Schubert 	c->repinfo.c = c;
4230c0caa2e2SCy Schubert 	c->callback = callback;
4231c0caa2e2SCy Schubert 	c->cb_arg = callback_arg;
42325469a995SCy Schubert 	c->socket = socket;
4233865f46b2SCy Schubert 	c->pp2_enabled = 0;
4234865f46b2SCy Schubert 	c->pp2_header_state = pp2_header_none;
4235c0caa2e2SCy Schubert 
4236c0caa2e2SCy Schubert 	c->http_min_version = http_version_2;
4237c0caa2e2SCy Schubert 	c->http2_stream_max_qbuffer_size = bufsize;
4238c0caa2e2SCy Schubert 	if(harden_large_queries && bufsize > 512)
4239c0caa2e2SCy Schubert 		c->http2_stream_max_qbuffer_size = 512;
4240c0caa2e2SCy Schubert 	c->http2_max_streams = http_max_streams;
4241c0caa2e2SCy Schubert 	if(!(c->http_endpoint = strdup(http_endpoint))) {
4242c0caa2e2SCy Schubert 		log_err("could not strdup http_endpoint");
4243c0caa2e2SCy Schubert 		sldns_buffer_free(c->buffer);
4244c0caa2e2SCy Schubert 		free(c->timeout);
4245c0caa2e2SCy Schubert 		free(c->ev);
4246c0caa2e2SCy Schubert 		free(c);
4247c0caa2e2SCy Schubert 		return NULL;
4248c0caa2e2SCy Schubert 	}
4249c0caa2e2SCy Schubert 	c->use_h2 = 0;
4250c0caa2e2SCy Schubert #ifdef HAVE_NGHTTP2
4251c0caa2e2SCy Schubert 	if(!(c->h2_session = http2_session_create(c))) {
4252c0caa2e2SCy Schubert 		log_err("could not create http2 session");
4253c0caa2e2SCy Schubert 		free(c->http_endpoint);
4254c0caa2e2SCy Schubert 		sldns_buffer_free(c->buffer);
4255c0caa2e2SCy Schubert 		free(c->timeout);
4256c0caa2e2SCy Schubert 		free(c->ev);
4257c0caa2e2SCy Schubert 		free(c);
4258c0caa2e2SCy Schubert 		return NULL;
4259c0caa2e2SCy Schubert 	}
4260c0caa2e2SCy Schubert 	if(!(c->h2_session->callbacks = http2_req_callbacks_create())) {
4261c0caa2e2SCy Schubert 		log_err("could not create http2 callbacks");
4262c0caa2e2SCy Schubert 		http2_session_delete(c->h2_session);
4263c0caa2e2SCy Schubert 		free(c->http_endpoint);
4264c0caa2e2SCy Schubert 		sldns_buffer_free(c->buffer);
4265c0caa2e2SCy Schubert 		free(c->timeout);
4266c0caa2e2SCy Schubert 		free(c->ev);
4267c0caa2e2SCy Schubert 		free(c);
4268c0caa2e2SCy Schubert 		return NULL;
4269c0caa2e2SCy Schubert 	}
4270c0caa2e2SCy Schubert #endif
4271c0caa2e2SCy Schubert 
4272c0caa2e2SCy Schubert 	/* add to parent free list */
4273c0caa2e2SCy Schubert 	c->tcp_free = parent->tcp_free;
4274c0caa2e2SCy Schubert 	parent->tcp_free = c;
4275c0caa2e2SCy Schubert 	/* ub_event stuff */
4276c0caa2e2SCy Schubert 	evbits = UB_EV_PERSIST | UB_EV_READ | UB_EV_TIMEOUT;
4277c0caa2e2SCy Schubert 	c->ev->ev = ub_event_new(base->eb->base, c->fd, evbits,
4278c0caa2e2SCy Schubert 		comm_point_http_handle_callback, c);
4279c0caa2e2SCy Schubert 	if(c->ev->ev == NULL)
4280c0caa2e2SCy Schubert 	{
4281c0caa2e2SCy Schubert 		log_err("could not set http handler event");
4282c0caa2e2SCy Schubert 		parent->tcp_free = c->tcp_free;
4283c0caa2e2SCy Schubert 		http2_session_delete(c->h2_session);
4284c0caa2e2SCy Schubert 		sldns_buffer_free(c->buffer);
4285c0caa2e2SCy Schubert 		free(c->timeout);
4286c0caa2e2SCy Schubert 		free(c->ev);
4287c0caa2e2SCy Schubert 		free(c);
4288c0caa2e2SCy Schubert 		return NULL;
4289c0caa2e2SCy Schubert 	}
4290c0caa2e2SCy Schubert 	return c;
4291c0caa2e2SCy Schubert }
4292c0caa2e2SCy Schubert 
4293b7579f77SDag-Erling Smørgrav struct comm_point*
42944c75e3aaSDag-Erling Smørgrav comm_point_create_tcp(struct comm_base *base, int fd, int num,
4295c0caa2e2SCy Schubert 	int idle_timeout, int harden_large_queries,
4296c0caa2e2SCy Schubert 	uint32_t http_max_streams, char* http_endpoint,
4297c0caa2e2SCy Schubert 	struct tcl_list* tcp_conn_limit, size_t bufsize,
4298c0caa2e2SCy Schubert 	struct sldns_buffer* spoolbuf, enum listen_type port_type,
4299865f46b2SCy Schubert 	int pp2_enabled, comm_point_callback_type* callback,
4300865f46b2SCy Schubert 	void* callback_arg, struct unbound_socket* socket)
4301b7579f77SDag-Erling Smørgrav {
4302b7579f77SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)calloc(1,
4303b7579f77SDag-Erling Smørgrav 		sizeof(struct comm_point));
4304b7579f77SDag-Erling Smørgrav 	short evbits;
4305b7579f77SDag-Erling Smørgrav 	int i;
4306b7579f77SDag-Erling Smørgrav 	/* first allocate the TCP accept listener */
4307b7579f77SDag-Erling Smørgrav 	if(!c)
4308b7579f77SDag-Erling Smørgrav 		return NULL;
4309b7579f77SDag-Erling Smørgrav 	c->ev = (struct internal_event*)calloc(1,
4310b7579f77SDag-Erling Smørgrav 		sizeof(struct internal_event));
4311b7579f77SDag-Erling Smørgrav 	if(!c->ev) {
4312b7579f77SDag-Erling Smørgrav 		free(c);
4313b7579f77SDag-Erling Smørgrav 		return NULL;
4314b7579f77SDag-Erling Smørgrav 	}
4315b7579f77SDag-Erling Smørgrav 	c->ev->base = base;
4316b7579f77SDag-Erling Smørgrav 	c->fd = fd;
4317b7579f77SDag-Erling Smørgrav 	c->buffer = NULL;
4318b7579f77SDag-Erling Smørgrav 	c->timeout = NULL;
4319b7579f77SDag-Erling Smørgrav 	c->tcp_is_reading = 0;
4320b7579f77SDag-Erling Smørgrav 	c->tcp_byte_count = 0;
43214c75e3aaSDag-Erling Smørgrav 	c->tcp_timeout_msec = idle_timeout;
43224c75e3aaSDag-Erling Smørgrav 	c->tcp_conn_limit = tcp_conn_limit;
43234c75e3aaSDag-Erling Smørgrav 	c->tcl_addr = NULL;
43244c75e3aaSDag-Erling Smørgrav 	c->tcp_keepalive = 0;
4325b7579f77SDag-Erling Smørgrav 	c->tcp_parent = NULL;
4326b7579f77SDag-Erling Smørgrav 	c->max_tcp_count = num;
432709a3aaf3SDag-Erling Smørgrav 	c->cur_tcp_count = 0;
4328b7579f77SDag-Erling Smørgrav 	c->tcp_handlers = (struct comm_point**)calloc((size_t)num,
4329b7579f77SDag-Erling Smørgrav 		sizeof(struct comm_point*));
4330b7579f77SDag-Erling Smørgrav 	if(!c->tcp_handlers) {
4331b7579f77SDag-Erling Smørgrav 		free(c->ev);
4332b7579f77SDag-Erling Smørgrav 		free(c);
4333b7579f77SDag-Erling Smørgrav 		return NULL;
4334b7579f77SDag-Erling Smørgrav 	}
4335b7579f77SDag-Erling Smørgrav 	c->tcp_free = NULL;
4336b7579f77SDag-Erling Smørgrav 	c->type = comm_tcp_accept;
4337b7579f77SDag-Erling Smørgrav 	c->tcp_do_close = 0;
4338b7579f77SDag-Erling Smørgrav 	c->do_not_close = 0;
4339b7579f77SDag-Erling Smørgrav 	c->tcp_do_toggle_rw = 0;
4340b7579f77SDag-Erling Smørgrav 	c->tcp_check_nb_connect = 0;
4341b5663de9SDag-Erling Smørgrav #ifdef USE_MSG_FASTOPEN
4342b5663de9SDag-Erling Smørgrav 	c->tcp_do_fastopen = 0;
4343b5663de9SDag-Erling Smørgrav #endif
434465b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
434565b390aaSDag-Erling Smørgrav 	c->dnscrypt = 0;
434665b390aaSDag-Erling Smørgrav 	c->dnscrypt_buffer = NULL;
434765b390aaSDag-Erling Smørgrav #endif
4348b7579f77SDag-Erling Smørgrav 	c->callback = NULL;
4349b7579f77SDag-Erling Smørgrav 	c->cb_arg = NULL;
43505469a995SCy Schubert 	c->socket = socket;
4351865f46b2SCy Schubert 	c->pp2_enabled = (port_type==listen_type_http?0:pp2_enabled);
4352865f46b2SCy Schubert 	c->pp2_header_state = pp2_header_none;
4353e2d15004SDag-Erling Smørgrav 	evbits = UB_EV_READ | UB_EV_PERSIST;
4354e2d15004SDag-Erling Smørgrav 	/* ub_event stuff */
4355e2d15004SDag-Erling Smørgrav 	c->ev->ev = ub_event_new(base->eb->base, c->fd, evbits,
4356e2d15004SDag-Erling Smørgrav 		comm_point_tcp_accept_callback, c);
4357e2d15004SDag-Erling Smørgrav 	if(c->ev->ev == NULL) {
4358e2d15004SDag-Erling Smørgrav 		log_err("could not baseset tcpacc event");
4359e2d15004SDag-Erling Smørgrav 		comm_point_delete(c);
4360e2d15004SDag-Erling Smørgrav 		return NULL;
4361e2d15004SDag-Erling Smørgrav 	}
4362e2d15004SDag-Erling Smørgrav 	if (ub_event_add(c->ev->ev, c->timeout) != 0) {
4363b7579f77SDag-Erling Smørgrav 		log_err("could not add tcpacc event");
4364b7579f77SDag-Erling Smørgrav 		comm_point_delete(c);
4365b7579f77SDag-Erling Smørgrav 		return NULL;
4366b7579f77SDag-Erling Smørgrav 	}
4367f44e67d1SCy Schubert 	c->event_added = 1;
4368c0caa2e2SCy Schubert 	/* now prealloc the handlers */
4369b7579f77SDag-Erling Smørgrav 	for(i=0; i<num; i++) {
4370c0caa2e2SCy Schubert 		if(port_type == listen_type_tcp ||
4371c0caa2e2SCy Schubert 			port_type == listen_type_ssl ||
4372c0caa2e2SCy Schubert 			port_type == listen_type_tcp_dnscrypt) {
4373b7579f77SDag-Erling Smørgrav 			c->tcp_handlers[i] = comm_point_create_tcp_handler(base,
43745469a995SCy Schubert 				c, bufsize, spoolbuf, callback, callback_arg, socket);
4375c0caa2e2SCy Schubert 		} else if(port_type == listen_type_http) {
4376c0caa2e2SCy Schubert 			c->tcp_handlers[i] = comm_point_create_http_handler(
4377c0caa2e2SCy Schubert 				base, c, bufsize, harden_large_queries,
4378c0caa2e2SCy Schubert 				http_max_streams, http_endpoint,
43795469a995SCy Schubert 				callback, callback_arg, socket);
4380c0caa2e2SCy Schubert 		}
4381c0caa2e2SCy Schubert 		else {
4382c0caa2e2SCy Schubert 			log_err("could not create tcp handler, unknown listen "
4383c0caa2e2SCy Schubert 				"type");
4384c0caa2e2SCy Schubert 			return NULL;
4385c0caa2e2SCy Schubert 		}
4386b7579f77SDag-Erling Smørgrav 		if(!c->tcp_handlers[i]) {
4387b7579f77SDag-Erling Smørgrav 			comm_point_delete(c);
4388b7579f77SDag-Erling Smørgrav 			return NULL;
4389b7579f77SDag-Erling Smørgrav 		}
4390b7579f77SDag-Erling Smørgrav 	}
4391b7579f77SDag-Erling Smørgrav 
4392b7579f77SDag-Erling Smørgrav 	return c;
4393b7579f77SDag-Erling Smørgrav }
4394b7579f77SDag-Erling Smørgrav 
4395b7579f77SDag-Erling Smørgrav struct comm_point*
4396b7579f77SDag-Erling Smørgrav comm_point_create_tcp_out(struct comm_base *base, size_t bufsize,
43973005e0a3SDag-Erling Smørgrav         comm_point_callback_type* callback, void* callback_arg)
4398b7579f77SDag-Erling Smørgrav {
4399b7579f77SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)calloc(1,
4400b7579f77SDag-Erling Smørgrav 		sizeof(struct comm_point));
4401b7579f77SDag-Erling Smørgrav 	short evbits;
4402b7579f77SDag-Erling Smørgrav 	if(!c)
4403b7579f77SDag-Erling Smørgrav 		return NULL;
4404b7579f77SDag-Erling Smørgrav 	c->ev = (struct internal_event*)calloc(1,
4405b7579f77SDag-Erling Smørgrav 		sizeof(struct internal_event));
4406b7579f77SDag-Erling Smørgrav 	if(!c->ev) {
4407b7579f77SDag-Erling Smørgrav 		free(c);
4408b7579f77SDag-Erling Smørgrav 		return NULL;
4409b7579f77SDag-Erling Smørgrav 	}
4410b7579f77SDag-Erling Smørgrav 	c->ev->base = base;
4411b7579f77SDag-Erling Smørgrav 	c->fd = -1;
441217d15b25SDag-Erling Smørgrav 	c->buffer = sldns_buffer_new(bufsize);
4413b7579f77SDag-Erling Smørgrav 	if(!c->buffer) {
4414b7579f77SDag-Erling Smørgrav 		free(c->ev);
4415b7579f77SDag-Erling Smørgrav 		free(c);
4416b7579f77SDag-Erling Smørgrav 		return NULL;
4417b7579f77SDag-Erling Smørgrav 	}
4418b7579f77SDag-Erling Smørgrav 	c->timeout = NULL;
4419b7579f77SDag-Erling Smørgrav 	c->tcp_is_reading = 0;
4420b7579f77SDag-Erling Smørgrav 	c->tcp_byte_count = 0;
44214c75e3aaSDag-Erling Smørgrav 	c->tcp_timeout_msec = TCP_QUERY_TIMEOUT;
44224c75e3aaSDag-Erling Smørgrav 	c->tcp_conn_limit = NULL;
44234c75e3aaSDag-Erling Smørgrav 	c->tcl_addr = NULL;
44244c75e3aaSDag-Erling Smørgrav 	c->tcp_keepalive = 0;
4425b7579f77SDag-Erling Smørgrav 	c->tcp_parent = NULL;
4426b7579f77SDag-Erling Smørgrav 	c->max_tcp_count = 0;
442709a3aaf3SDag-Erling Smørgrav 	c->cur_tcp_count = 0;
4428b7579f77SDag-Erling Smørgrav 	c->tcp_handlers = NULL;
4429b7579f77SDag-Erling Smørgrav 	c->tcp_free = NULL;
4430b7579f77SDag-Erling Smørgrav 	c->type = comm_tcp;
4431b7579f77SDag-Erling Smørgrav 	c->tcp_do_close = 0;
4432b7579f77SDag-Erling Smørgrav 	c->do_not_close = 0;
4433b7579f77SDag-Erling Smørgrav 	c->tcp_do_toggle_rw = 1;
4434b7579f77SDag-Erling Smørgrav 	c->tcp_check_nb_connect = 1;
4435b5663de9SDag-Erling Smørgrav #ifdef USE_MSG_FASTOPEN
4436b5663de9SDag-Erling Smørgrav 	c->tcp_do_fastopen = 1;
4437b5663de9SDag-Erling Smørgrav #endif
443865b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
443965b390aaSDag-Erling Smørgrav 	c->dnscrypt = 0;
444065b390aaSDag-Erling Smørgrav 	c->dnscrypt_buffer = c->buffer;
444165b390aaSDag-Erling Smørgrav #endif
4442b7579f77SDag-Erling Smørgrav 	c->repinfo.c = c;
4443b7579f77SDag-Erling Smørgrav 	c->callback = callback;
4444b7579f77SDag-Erling Smørgrav 	c->cb_arg = callback_arg;
4445865f46b2SCy Schubert 	c->pp2_enabled = 0;
4446865f46b2SCy Schubert 	c->pp2_header_state = pp2_header_none;
4447e2d15004SDag-Erling Smørgrav 	evbits = UB_EV_PERSIST | UB_EV_WRITE;
4448e2d15004SDag-Erling Smørgrav 	c->ev->ev = ub_event_new(base->eb->base, c->fd, evbits,
4449e2d15004SDag-Erling Smørgrav 		comm_point_tcp_handle_callback, c);
4450e2d15004SDag-Erling Smørgrav 	if(c->ev->ev == NULL)
4451b7579f77SDag-Erling Smørgrav 	{
4452e2d15004SDag-Erling Smørgrav 		log_err("could not baseset tcpout event");
445317d15b25SDag-Erling Smørgrav 		sldns_buffer_free(c->buffer);
4454b7579f77SDag-Erling Smørgrav 		free(c->ev);
4455b7579f77SDag-Erling Smørgrav 		free(c);
4456b7579f77SDag-Erling Smørgrav 		return NULL;
4457b7579f77SDag-Erling Smørgrav 	}
4458b7579f77SDag-Erling Smørgrav 
4459b7579f77SDag-Erling Smørgrav 	return c;
4460b7579f77SDag-Erling Smørgrav }
4461b7579f77SDag-Erling Smørgrav 
4462b7579f77SDag-Erling Smørgrav struct comm_point*
446357bddd21SDag-Erling Smørgrav comm_point_create_http_out(struct comm_base *base, size_t bufsize,
446457bddd21SDag-Erling Smørgrav         comm_point_callback_type* callback, void* callback_arg,
446557bddd21SDag-Erling Smørgrav 	sldns_buffer* temp)
446657bddd21SDag-Erling Smørgrav {
446757bddd21SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)calloc(1,
446857bddd21SDag-Erling Smørgrav 		sizeof(struct comm_point));
446957bddd21SDag-Erling Smørgrav 	short evbits;
447057bddd21SDag-Erling Smørgrav 	if(!c)
447157bddd21SDag-Erling Smørgrav 		return NULL;
447257bddd21SDag-Erling Smørgrav 	c->ev = (struct internal_event*)calloc(1,
447357bddd21SDag-Erling Smørgrav 		sizeof(struct internal_event));
447457bddd21SDag-Erling Smørgrav 	if(!c->ev) {
447557bddd21SDag-Erling Smørgrav 		free(c);
447657bddd21SDag-Erling Smørgrav 		return NULL;
447757bddd21SDag-Erling Smørgrav 	}
447857bddd21SDag-Erling Smørgrav 	c->ev->base = base;
447957bddd21SDag-Erling Smørgrav 	c->fd = -1;
448057bddd21SDag-Erling Smørgrav 	c->buffer = sldns_buffer_new(bufsize);
448157bddd21SDag-Erling Smørgrav 	if(!c->buffer) {
448257bddd21SDag-Erling Smørgrav 		free(c->ev);
448357bddd21SDag-Erling Smørgrav 		free(c);
448457bddd21SDag-Erling Smørgrav 		return NULL;
448557bddd21SDag-Erling Smørgrav 	}
448657bddd21SDag-Erling Smørgrav 	c->timeout = NULL;
448757bddd21SDag-Erling Smørgrav 	c->tcp_is_reading = 0;
448857bddd21SDag-Erling Smørgrav 	c->tcp_byte_count = 0;
448957bddd21SDag-Erling Smørgrav 	c->tcp_parent = NULL;
449057bddd21SDag-Erling Smørgrav 	c->max_tcp_count = 0;
449157bddd21SDag-Erling Smørgrav 	c->cur_tcp_count = 0;
449257bddd21SDag-Erling Smørgrav 	c->tcp_handlers = NULL;
449357bddd21SDag-Erling Smørgrav 	c->tcp_free = NULL;
449457bddd21SDag-Erling Smørgrav 	c->type = comm_http;
449557bddd21SDag-Erling Smørgrav 	c->tcp_do_close = 0;
449657bddd21SDag-Erling Smørgrav 	c->do_not_close = 0;
449757bddd21SDag-Erling Smørgrav 	c->tcp_do_toggle_rw = 1;
449857bddd21SDag-Erling Smørgrav 	c->tcp_check_nb_connect = 1;
449957bddd21SDag-Erling Smørgrav 	c->http_in_headers = 1;
450057bddd21SDag-Erling Smørgrav 	c->http_in_chunk_headers = 0;
450157bddd21SDag-Erling Smørgrav 	c->http_is_chunked = 0;
450257bddd21SDag-Erling Smørgrav 	c->http_temp = temp;
450357bddd21SDag-Erling Smørgrav #ifdef USE_MSG_FASTOPEN
450457bddd21SDag-Erling Smørgrav 	c->tcp_do_fastopen = 1;
450557bddd21SDag-Erling Smørgrav #endif
450657bddd21SDag-Erling Smørgrav #ifdef USE_DNSCRYPT
450757bddd21SDag-Erling Smørgrav 	c->dnscrypt = 0;
450857bddd21SDag-Erling Smørgrav 	c->dnscrypt_buffer = c->buffer;
450957bddd21SDag-Erling Smørgrav #endif
451057bddd21SDag-Erling Smørgrav 	c->repinfo.c = c;
451157bddd21SDag-Erling Smørgrav 	c->callback = callback;
451257bddd21SDag-Erling Smørgrav 	c->cb_arg = callback_arg;
4513865f46b2SCy Schubert 	c->pp2_enabled = 0;
4514865f46b2SCy Schubert 	c->pp2_header_state = pp2_header_none;
451557bddd21SDag-Erling Smørgrav 	evbits = UB_EV_PERSIST | UB_EV_WRITE;
451657bddd21SDag-Erling Smørgrav 	c->ev->ev = ub_event_new(base->eb->base, c->fd, evbits,
451757bddd21SDag-Erling Smørgrav 		comm_point_http_handle_callback, c);
451857bddd21SDag-Erling Smørgrav 	if(c->ev->ev == NULL)
451957bddd21SDag-Erling Smørgrav 	{
452057bddd21SDag-Erling Smørgrav 		log_err("could not baseset tcpout event");
452157bddd21SDag-Erling Smørgrav #ifdef HAVE_SSL
452257bddd21SDag-Erling Smørgrav 		SSL_free(c->ssl);
452357bddd21SDag-Erling Smørgrav #endif
452457bddd21SDag-Erling Smørgrav 		sldns_buffer_free(c->buffer);
452557bddd21SDag-Erling Smørgrav 		free(c->ev);
452657bddd21SDag-Erling Smørgrav 		free(c);
452757bddd21SDag-Erling Smørgrav 		return NULL;
452857bddd21SDag-Erling Smørgrav 	}
452957bddd21SDag-Erling Smørgrav 
453057bddd21SDag-Erling Smørgrav 	return c;
453157bddd21SDag-Erling Smørgrav }
453257bddd21SDag-Erling Smørgrav 
453357bddd21SDag-Erling Smørgrav struct comm_point*
4534b7579f77SDag-Erling Smørgrav comm_point_create_local(struct comm_base *base, int fd, size_t bufsize,
45353005e0a3SDag-Erling Smørgrav         comm_point_callback_type* callback, void* callback_arg)
4536b7579f77SDag-Erling Smørgrav {
4537b7579f77SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)calloc(1,
4538b7579f77SDag-Erling Smørgrav 		sizeof(struct comm_point));
4539b7579f77SDag-Erling Smørgrav 	short evbits;
4540b7579f77SDag-Erling Smørgrav 	if(!c)
4541b7579f77SDag-Erling Smørgrav 		return NULL;
4542b7579f77SDag-Erling Smørgrav 	c->ev = (struct internal_event*)calloc(1,
4543b7579f77SDag-Erling Smørgrav 		sizeof(struct internal_event));
4544b7579f77SDag-Erling Smørgrav 	if(!c->ev) {
4545b7579f77SDag-Erling Smørgrav 		free(c);
4546b7579f77SDag-Erling Smørgrav 		return NULL;
4547b7579f77SDag-Erling Smørgrav 	}
4548b7579f77SDag-Erling Smørgrav 	c->ev->base = base;
4549b7579f77SDag-Erling Smørgrav 	c->fd = fd;
455017d15b25SDag-Erling Smørgrav 	c->buffer = sldns_buffer_new(bufsize);
4551b7579f77SDag-Erling Smørgrav 	if(!c->buffer) {
4552b7579f77SDag-Erling Smørgrav 		free(c->ev);
4553b7579f77SDag-Erling Smørgrav 		free(c);
4554b7579f77SDag-Erling Smørgrav 		return NULL;
4555b7579f77SDag-Erling Smørgrav 	}
4556b7579f77SDag-Erling Smørgrav 	c->timeout = NULL;
4557b7579f77SDag-Erling Smørgrav 	c->tcp_is_reading = 1;
4558b7579f77SDag-Erling Smørgrav 	c->tcp_byte_count = 0;
4559b7579f77SDag-Erling Smørgrav 	c->tcp_parent = NULL;
4560b7579f77SDag-Erling Smørgrav 	c->max_tcp_count = 0;
456109a3aaf3SDag-Erling Smørgrav 	c->cur_tcp_count = 0;
4562b7579f77SDag-Erling Smørgrav 	c->tcp_handlers = NULL;
4563b7579f77SDag-Erling Smørgrav 	c->tcp_free = NULL;
4564b7579f77SDag-Erling Smørgrav 	c->type = comm_local;
4565b7579f77SDag-Erling Smørgrav 	c->tcp_do_close = 0;
4566b7579f77SDag-Erling Smørgrav 	c->do_not_close = 1;
4567b7579f77SDag-Erling Smørgrav 	c->tcp_do_toggle_rw = 0;
4568b7579f77SDag-Erling Smørgrav 	c->tcp_check_nb_connect = 0;
4569b5663de9SDag-Erling Smørgrav #ifdef USE_MSG_FASTOPEN
4570b5663de9SDag-Erling Smørgrav 	c->tcp_do_fastopen = 0;
4571b5663de9SDag-Erling Smørgrav #endif
457265b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
457365b390aaSDag-Erling Smørgrav 	c->dnscrypt = 0;
457465b390aaSDag-Erling Smørgrav 	c->dnscrypt_buffer = c->buffer;
457565b390aaSDag-Erling Smørgrav #endif
4576b7579f77SDag-Erling Smørgrav 	c->callback = callback;
4577b7579f77SDag-Erling Smørgrav 	c->cb_arg = callback_arg;
4578865f46b2SCy Schubert 	c->pp2_enabled = 0;
4579865f46b2SCy Schubert 	c->pp2_header_state = pp2_header_none;
4580e2d15004SDag-Erling Smørgrav 	/* ub_event stuff */
4581e2d15004SDag-Erling Smørgrav 	evbits = UB_EV_PERSIST | UB_EV_READ;
4582e2d15004SDag-Erling Smørgrav 	c->ev->ev = ub_event_new(base->eb->base, c->fd, evbits,
4583e2d15004SDag-Erling Smørgrav 		comm_point_local_handle_callback, c);
4584e2d15004SDag-Erling Smørgrav 	if(c->ev->ev == NULL) {
4585e2d15004SDag-Erling Smørgrav 		log_err("could not baseset localhdl event");
4586e2d15004SDag-Erling Smørgrav 		free(c->ev);
4587e2d15004SDag-Erling Smørgrav 		free(c);
4588e2d15004SDag-Erling Smørgrav 		return NULL;
4589e2d15004SDag-Erling Smørgrav 	}
4590e2d15004SDag-Erling Smørgrav 	if (ub_event_add(c->ev->ev, c->timeout) != 0) {
4591b7579f77SDag-Erling Smørgrav 		log_err("could not add localhdl event");
4592e2d15004SDag-Erling Smørgrav 		ub_event_free(c->ev->ev);
4593b7579f77SDag-Erling Smørgrav 		free(c->ev);
4594b7579f77SDag-Erling Smørgrav 		free(c);
4595b7579f77SDag-Erling Smørgrav 		return NULL;
4596b7579f77SDag-Erling Smørgrav 	}
4597f44e67d1SCy Schubert 	c->event_added = 1;
4598b7579f77SDag-Erling Smørgrav 	return c;
4599b7579f77SDag-Erling Smørgrav }
4600b7579f77SDag-Erling Smørgrav 
4601b7579f77SDag-Erling Smørgrav struct comm_point*
4602b7579f77SDag-Erling Smørgrav comm_point_create_raw(struct comm_base* base, int fd, int writing,
46033005e0a3SDag-Erling Smørgrav 	comm_point_callback_type* callback, void* callback_arg)
4604b7579f77SDag-Erling Smørgrav {
4605b7579f77SDag-Erling Smørgrav 	struct comm_point* c = (struct comm_point*)calloc(1,
4606b7579f77SDag-Erling Smørgrav 		sizeof(struct comm_point));
4607b7579f77SDag-Erling Smørgrav 	short evbits;
4608b7579f77SDag-Erling Smørgrav 	if(!c)
4609b7579f77SDag-Erling Smørgrav 		return NULL;
4610b7579f77SDag-Erling Smørgrav 	c->ev = (struct internal_event*)calloc(1,
4611b7579f77SDag-Erling Smørgrav 		sizeof(struct internal_event));
4612b7579f77SDag-Erling Smørgrav 	if(!c->ev) {
4613b7579f77SDag-Erling Smørgrav 		free(c);
4614b7579f77SDag-Erling Smørgrav 		return NULL;
4615b7579f77SDag-Erling Smørgrav 	}
4616b7579f77SDag-Erling Smørgrav 	c->ev->base = base;
4617b7579f77SDag-Erling Smørgrav 	c->fd = fd;
4618b7579f77SDag-Erling Smørgrav 	c->buffer = NULL;
4619b7579f77SDag-Erling Smørgrav 	c->timeout = NULL;
4620b7579f77SDag-Erling Smørgrav 	c->tcp_is_reading = 0;
4621b7579f77SDag-Erling Smørgrav 	c->tcp_byte_count = 0;
4622b7579f77SDag-Erling Smørgrav 	c->tcp_parent = NULL;
4623b7579f77SDag-Erling Smørgrav 	c->max_tcp_count = 0;
462409a3aaf3SDag-Erling Smørgrav 	c->cur_tcp_count = 0;
4625b7579f77SDag-Erling Smørgrav 	c->tcp_handlers = NULL;
4626b7579f77SDag-Erling Smørgrav 	c->tcp_free = NULL;
4627b7579f77SDag-Erling Smørgrav 	c->type = comm_raw;
4628b7579f77SDag-Erling Smørgrav 	c->tcp_do_close = 0;
4629b7579f77SDag-Erling Smørgrav 	c->do_not_close = 1;
4630b7579f77SDag-Erling Smørgrav 	c->tcp_do_toggle_rw = 0;
4631b7579f77SDag-Erling Smørgrav 	c->tcp_check_nb_connect = 0;
4632b5663de9SDag-Erling Smørgrav #ifdef USE_MSG_FASTOPEN
4633b5663de9SDag-Erling Smørgrav 	c->tcp_do_fastopen = 0;
4634b5663de9SDag-Erling Smørgrav #endif
463565b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
463665b390aaSDag-Erling Smørgrav 	c->dnscrypt = 0;
463765b390aaSDag-Erling Smørgrav 	c->dnscrypt_buffer = c->buffer;
463865b390aaSDag-Erling Smørgrav #endif
4639b7579f77SDag-Erling Smørgrav 	c->callback = callback;
4640b7579f77SDag-Erling Smørgrav 	c->cb_arg = callback_arg;
4641865f46b2SCy Schubert 	c->pp2_enabled = 0;
4642865f46b2SCy Schubert 	c->pp2_header_state = pp2_header_none;
4643e2d15004SDag-Erling Smørgrav 	/* ub_event stuff */
4644b7579f77SDag-Erling Smørgrav 	if(writing)
4645e2d15004SDag-Erling Smørgrav 		evbits = UB_EV_PERSIST | UB_EV_WRITE;
4646e2d15004SDag-Erling Smørgrav 	else 	evbits = UB_EV_PERSIST | UB_EV_READ;
4647e2d15004SDag-Erling Smørgrav 	c->ev->ev = ub_event_new(base->eb->base, c->fd, evbits,
4648e2d15004SDag-Erling Smørgrav 		comm_point_raw_handle_callback, c);
4649e2d15004SDag-Erling Smørgrav 	if(c->ev->ev == NULL) {
4650e2d15004SDag-Erling Smørgrav 		log_err("could not baseset rawhdl event");
4651e2d15004SDag-Erling Smørgrav 		free(c->ev);
4652e2d15004SDag-Erling Smørgrav 		free(c);
4653e2d15004SDag-Erling Smørgrav 		return NULL;
4654e2d15004SDag-Erling Smørgrav 	}
4655e2d15004SDag-Erling Smørgrav 	if (ub_event_add(c->ev->ev, c->timeout) != 0) {
4656b7579f77SDag-Erling Smørgrav 		log_err("could not add rawhdl event");
4657e2d15004SDag-Erling Smørgrav 		ub_event_free(c->ev->ev);
4658b7579f77SDag-Erling Smørgrav 		free(c->ev);
4659b7579f77SDag-Erling Smørgrav 		free(c);
4660b7579f77SDag-Erling Smørgrav 		return NULL;
4661b7579f77SDag-Erling Smørgrav 	}
4662f44e67d1SCy Schubert 	c->event_added = 1;
4663b7579f77SDag-Erling Smørgrav 	return c;
4664b7579f77SDag-Erling Smørgrav }
4665b7579f77SDag-Erling Smørgrav 
4666b7579f77SDag-Erling Smørgrav void
4667b7579f77SDag-Erling Smørgrav comm_point_close(struct comm_point* c)
4668b7579f77SDag-Erling Smørgrav {
4669b7579f77SDag-Erling Smørgrav 	if(!c)
4670b7579f77SDag-Erling Smørgrav 		return;
46713bd4df0aSDag-Erling Smørgrav 	if(c->fd != -1) {
4672369c6923SCy Schubert 		verbose(5, "comm_point_close of %d: event_del", c->fd);
4673f44e67d1SCy Schubert 		if(c->event_added) {
4674e2d15004SDag-Erling Smørgrav 			if(ub_event_del(c->ev->ev) != 0) {
4675b7579f77SDag-Erling Smørgrav 				log_err("could not event_del on close");
4676b7579f77SDag-Erling Smørgrav 			}
4677f44e67d1SCy Schubert 			c->event_added = 0;
4678f44e67d1SCy Schubert 		}
46793bd4df0aSDag-Erling Smørgrav 	}
46804c75e3aaSDag-Erling Smørgrav 	tcl_close_connection(c->tcl_addr);
4681e86b9096SDag-Erling Smørgrav 	if(c->tcp_req_info)
4682e86b9096SDag-Erling Smørgrav 		tcp_req_info_clear(c->tcp_req_info);
4683c0caa2e2SCy Schubert 	if(c->h2_session)
4684c0caa2e2SCy Schubert 		http2_session_server_delete(c->h2_session);
46851838dec3SCy Schubert 	/* stop the comm point from reading or writing after it is closed. */
46861838dec3SCy Schubert 	if(c->tcp_more_read_again && *c->tcp_more_read_again)
46871838dec3SCy Schubert 		*c->tcp_more_read_again = 0;
46881838dec3SCy Schubert 	if(c->tcp_more_write_again && *c->tcp_more_write_again)
46891838dec3SCy Schubert 		*c->tcp_more_write_again = 0;
4690c0caa2e2SCy Schubert 
4691b7579f77SDag-Erling Smørgrav 	/* close fd after removing from event lists, or epoll.. is messed up */
4692b7579f77SDag-Erling Smørgrav 	if(c->fd != -1 && !c->do_not_close) {
46935469a995SCy Schubert #ifdef USE_WINSOCK
46943bd4df0aSDag-Erling Smørgrav 		if(c->type == comm_tcp || c->type == comm_http) {
46953bd4df0aSDag-Erling Smørgrav 			/* delete sticky events for the fd, it gets closed */
46963bd4df0aSDag-Erling Smørgrav 			ub_winsock_tcp_wouldblock(c->ev->ev, UB_EV_READ);
46973bd4df0aSDag-Erling Smørgrav 			ub_winsock_tcp_wouldblock(c->ev->ev, UB_EV_WRITE);
46983bd4df0aSDag-Erling Smørgrav 		}
46995469a995SCy Schubert #endif
4700b7579f77SDag-Erling Smørgrav 		verbose(VERB_ALGO, "close fd %d", c->fd);
4701c0caa2e2SCy Schubert 		sock_close(c->fd);
4702b7579f77SDag-Erling Smørgrav 	}
4703b7579f77SDag-Erling Smørgrav 	c->fd = -1;
4704b7579f77SDag-Erling Smørgrav }
4705b7579f77SDag-Erling Smørgrav 
4706b7579f77SDag-Erling Smørgrav void
4707b7579f77SDag-Erling Smørgrav comm_point_delete(struct comm_point* c)
4708b7579f77SDag-Erling Smørgrav {
4709b7579f77SDag-Erling Smørgrav 	if(!c)
4710b7579f77SDag-Erling Smørgrav 		return;
471157bddd21SDag-Erling Smørgrav 	if((c->type == comm_tcp || c->type == comm_http) && c->ssl) {
47128ed2b524SDag-Erling Smørgrav #ifdef HAVE_SSL
4713b7579f77SDag-Erling Smørgrav 		SSL_shutdown(c->ssl);
4714b7579f77SDag-Erling Smørgrav 		SSL_free(c->ssl);
47158ed2b524SDag-Erling Smørgrav #endif
4716b7579f77SDag-Erling Smørgrav 	}
4717c0caa2e2SCy Schubert 	if(c->type == comm_http && c->http_endpoint) {
4718c0caa2e2SCy Schubert 		free(c->http_endpoint);
4719c0caa2e2SCy Schubert 		c->http_endpoint = NULL;
4720c0caa2e2SCy Schubert 	}
4721b7579f77SDag-Erling Smørgrav 	comm_point_close(c);
4722b7579f77SDag-Erling Smørgrav 	if(c->tcp_handlers) {
4723b7579f77SDag-Erling Smørgrav 		int i;
4724b7579f77SDag-Erling Smørgrav 		for(i=0; i<c->max_tcp_count; i++)
4725b7579f77SDag-Erling Smørgrav 			comm_point_delete(c->tcp_handlers[i]);
4726b7579f77SDag-Erling Smørgrav 		free(c->tcp_handlers);
4727b7579f77SDag-Erling Smørgrav 	}
4728b7579f77SDag-Erling Smørgrav 	free(c->timeout);
472957bddd21SDag-Erling Smørgrav 	if(c->type == comm_tcp || c->type == comm_local || c->type == comm_http) {
473017d15b25SDag-Erling Smørgrav 		sldns_buffer_free(c->buffer);
473165b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
473265b390aaSDag-Erling Smørgrav 		if(c->dnscrypt && c->dnscrypt_buffer != c->buffer) {
473365b390aaSDag-Erling Smørgrav 			sldns_buffer_free(c->dnscrypt_buffer);
473465b390aaSDag-Erling Smørgrav 		}
473565b390aaSDag-Erling Smørgrav #endif
4736e86b9096SDag-Erling Smørgrav 		if(c->tcp_req_info) {
4737e86b9096SDag-Erling Smørgrav 			tcp_req_info_delete(c->tcp_req_info);
4738e86b9096SDag-Erling Smørgrav 		}
4739c0caa2e2SCy Schubert 		if(c->h2_session) {
4740c0caa2e2SCy Schubert 			http2_session_delete(c->h2_session);
4741c0caa2e2SCy Schubert 		}
474265b390aaSDag-Erling Smørgrav 	}
4743e2d15004SDag-Erling Smørgrav 	ub_event_free(c->ev->ev);
4744b7579f77SDag-Erling Smørgrav 	free(c->ev);
4745b7579f77SDag-Erling Smørgrav 	free(c);
4746b7579f77SDag-Erling Smørgrav }
4747b7579f77SDag-Erling Smørgrav 
4748b7579f77SDag-Erling Smørgrav void
4749b7579f77SDag-Erling Smørgrav comm_point_send_reply(struct comm_reply *repinfo)
4750b7579f77SDag-Erling Smørgrav {
475165b390aaSDag-Erling Smørgrav 	struct sldns_buffer* buffer;
4752b7579f77SDag-Erling Smørgrav 	log_assert(repinfo && repinfo->c);
475365b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
475465b390aaSDag-Erling Smørgrav 	buffer = repinfo->c->dnscrypt_buffer;
475565b390aaSDag-Erling Smørgrav 	if(!dnsc_handle_uncurved_request(repinfo)) {
475665b390aaSDag-Erling Smørgrav 		return;
475765b390aaSDag-Erling Smørgrav 	}
475865b390aaSDag-Erling Smørgrav #else
475965b390aaSDag-Erling Smørgrav 	buffer = repinfo->c->buffer;
476065b390aaSDag-Erling Smørgrav #endif
4761b7579f77SDag-Erling Smørgrav 	if(repinfo->c->type == comm_udp) {
4762b7579f77SDag-Erling Smørgrav 		if(repinfo->srctype)
4763865f46b2SCy Schubert 			comm_point_send_udp_msg_if(repinfo->c, buffer,
4764865f46b2SCy Schubert 				(struct sockaddr*)&repinfo->remote_addr,
4765865f46b2SCy Schubert 				repinfo->remote_addrlen, repinfo);
4766b7579f77SDag-Erling Smørgrav 		else
476765b390aaSDag-Erling Smørgrav 			comm_point_send_udp_msg(repinfo->c, buffer,
4768865f46b2SCy Schubert 				(struct sockaddr*)&repinfo->remote_addr,
4769865f46b2SCy Schubert 				repinfo->remote_addrlen, 0);
4770ff825849SDag-Erling Smørgrav #ifdef USE_DNSTAP
47715469a995SCy Schubert 		/*
47725469a995SCy Schubert 		 * sending src (client)/dst (local service) addresses over DNSTAP from udp callback
47735469a995SCy Schubert 		 */
47745469a995SCy Schubert 		if(repinfo->c->dtenv != NULL && repinfo->c->dtenv->log_client_response_messages) {
47755469a995SCy Schubert 			log_addr(VERB_ALGO, "from local addr", (void*)repinfo->c->socket->addr->ai_addr, repinfo->c->socket->addr->ai_addrlen);
4776865f46b2SCy Schubert 			log_addr(VERB_ALGO, "response to client", &repinfo->client_addr, repinfo->client_addrlen);
4777*b7c0c8c1SCy Schubert 			dt_msg_send_client_response(repinfo->c->dtenv, &repinfo->client_addr, (void*)repinfo->c->socket->addr->ai_addr, repinfo->c->type, repinfo->c->ssl, repinfo->c->buffer);
47785469a995SCy Schubert 		}
4779ff825849SDag-Erling Smørgrav #endif
4780b7579f77SDag-Erling Smørgrav 	} else {
4781ff825849SDag-Erling Smørgrav #ifdef USE_DNSTAP
47825469a995SCy Schubert 		/*
47835469a995SCy Schubert 		 * sending src (client)/dst (local service) addresses over DNSTAP from TCP callback
47845469a995SCy Schubert 		 */
47855469a995SCy Schubert 		if(repinfo->c->tcp_parent->dtenv != NULL && repinfo->c->tcp_parent->dtenv->log_client_response_messages) {
47865469a995SCy Schubert 			log_addr(VERB_ALGO, "from local addr", (void*)repinfo->c->socket->addr->ai_addr, repinfo->c->socket->addr->ai_addrlen);
4787865f46b2SCy Schubert 			log_addr(VERB_ALGO, "response to client", &repinfo->client_addr, repinfo->client_addrlen);
4788*b7c0c8c1SCy Schubert 			dt_msg_send_client_response(repinfo->c->tcp_parent->dtenv, &repinfo->client_addr, (void*)repinfo->c->socket->addr->ai_addr, repinfo->c->type, repinfo->c->ssl,
47895469a995SCy Schubert 				( repinfo->c->tcp_req_info? repinfo->c->tcp_req_info->spool_buffer: repinfo->c->buffer ));
47905469a995SCy Schubert 		}
4791ff825849SDag-Erling Smørgrav #endif
4792e86b9096SDag-Erling Smørgrav 		if(repinfo->c->tcp_req_info) {
4793e86b9096SDag-Erling Smørgrav 			tcp_req_info_send_reply(repinfo->c->tcp_req_info);
4794c0caa2e2SCy Schubert 		} else if(repinfo->c->use_h2) {
4795c0caa2e2SCy Schubert 			if(!http2_submit_dns_response(repinfo->c->h2_session)) {
4796c0caa2e2SCy Schubert 				comm_point_drop_reply(repinfo);
4797c0caa2e2SCy Schubert 				return;
4798c0caa2e2SCy Schubert 			}
4799c0caa2e2SCy Schubert 			repinfo->c->h2_stream = NULL;
4800c0caa2e2SCy Schubert 			repinfo->c->tcp_is_reading = 0;
4801c0caa2e2SCy Schubert 			comm_point_stop_listening(repinfo->c);
4802c0caa2e2SCy Schubert 			comm_point_start_listening(repinfo->c, -1,
4803f44e67d1SCy Schubert 				adjusted_tcp_timeout(repinfo->c));
4804c0caa2e2SCy Schubert 			return;
4805e86b9096SDag-Erling Smørgrav 		} else {
4806b5663de9SDag-Erling Smørgrav 			comm_point_start_listening(repinfo->c, -1,
4807f44e67d1SCy Schubert 				adjusted_tcp_timeout(repinfo->c));
4808b7579f77SDag-Erling Smørgrav 		}
4809b7579f77SDag-Erling Smørgrav 	}
4810e86b9096SDag-Erling Smørgrav }
4811b7579f77SDag-Erling Smørgrav 
4812b7579f77SDag-Erling Smørgrav void
4813b7579f77SDag-Erling Smørgrav comm_point_drop_reply(struct comm_reply* repinfo)
4814b7579f77SDag-Erling Smørgrav {
4815b7579f77SDag-Erling Smørgrav 	if(!repinfo)
4816b7579f77SDag-Erling Smørgrav 		return;
48170eefd307SCy Schubert 	log_assert(repinfo->c);
4818b7579f77SDag-Erling Smørgrav 	log_assert(repinfo->c->type != comm_tcp_accept);
4819b7579f77SDag-Erling Smørgrav 	if(repinfo->c->type == comm_udp)
4820b7579f77SDag-Erling Smørgrav 		return;
4821e86b9096SDag-Erling Smørgrav 	if(repinfo->c->tcp_req_info)
4822e86b9096SDag-Erling Smørgrav 		repinfo->c->tcp_req_info->is_drop = 1;
4823c0caa2e2SCy Schubert 	if(repinfo->c->type == comm_http) {
4824c0caa2e2SCy Schubert 		if(repinfo->c->h2_session) {
4825c0caa2e2SCy Schubert 			repinfo->c->h2_session->is_drop = 1;
4826c0caa2e2SCy Schubert 			if(!repinfo->c->h2_session->postpone_drop)
4827c0caa2e2SCy Schubert 				reclaim_http_handler(repinfo->c);
4828c0caa2e2SCy Schubert 			return;
4829c0caa2e2SCy Schubert 		}
4830c0caa2e2SCy Schubert 		reclaim_http_handler(repinfo->c);
4831c0caa2e2SCy Schubert 		return;
4832c0caa2e2SCy Schubert 	}
4833b7579f77SDag-Erling Smørgrav 	reclaim_tcp_handler(repinfo->c);
4834b7579f77SDag-Erling Smørgrav }
4835b7579f77SDag-Erling Smørgrav 
4836b7579f77SDag-Erling Smørgrav void
4837b7579f77SDag-Erling Smørgrav comm_point_stop_listening(struct comm_point* c)
4838b7579f77SDag-Erling Smørgrav {
4839b7579f77SDag-Erling Smørgrav 	verbose(VERB_ALGO, "comm point stop listening %d", c->fd);
4840f44e67d1SCy Schubert 	if(c->event_added) {
4841e2d15004SDag-Erling Smørgrav 		if(ub_event_del(c->ev->ev) != 0) {
4842b7579f77SDag-Erling Smørgrav 			log_err("event_del error to stoplisten");
4843b7579f77SDag-Erling Smørgrav 		}
4844f44e67d1SCy Schubert 		c->event_added = 0;
4845f44e67d1SCy Schubert 	}
4846b7579f77SDag-Erling Smørgrav }
4847b7579f77SDag-Erling Smørgrav 
4848b7579f77SDag-Erling Smørgrav void
4849b5663de9SDag-Erling Smørgrav comm_point_start_listening(struct comm_point* c, int newfd, int msec)
4850b7579f77SDag-Erling Smørgrav {
4851e86b9096SDag-Erling Smørgrav 	verbose(VERB_ALGO, "comm point start listening %d (%d msec)",
4852e86b9096SDag-Erling Smørgrav 		c->fd==-1?newfd:c->fd, msec);
4853b7579f77SDag-Erling Smørgrav 	if(c->type == comm_tcp_accept && !c->tcp_free) {
4854b7579f77SDag-Erling Smørgrav 		/* no use to start listening no free slots. */
4855b7579f77SDag-Erling Smørgrav 		return;
4856b7579f77SDag-Erling Smørgrav 	}
4857f44e67d1SCy Schubert 	if(c->event_added) {
4858f44e67d1SCy Schubert 		if(ub_event_del(c->ev->ev) != 0) {
4859f44e67d1SCy Schubert 			log_err("event_del error to startlisten");
4860f44e67d1SCy Schubert 		}
4861f44e67d1SCy Schubert 		c->event_added = 0;
4862f44e67d1SCy Schubert 	}
4863b5663de9SDag-Erling Smørgrav 	if(msec != -1 && msec != 0) {
4864b7579f77SDag-Erling Smørgrav 		if(!c->timeout) {
4865b7579f77SDag-Erling Smørgrav 			c->timeout = (struct timeval*)malloc(sizeof(
4866b7579f77SDag-Erling Smørgrav 				struct timeval));
4867b7579f77SDag-Erling Smørgrav 			if(!c->timeout) {
4868b7579f77SDag-Erling Smørgrav 				log_err("cpsl: malloc failed. No net read.");
4869b7579f77SDag-Erling Smørgrav 				return;
4870b7579f77SDag-Erling Smørgrav 			}
4871b7579f77SDag-Erling Smørgrav 		}
4872e2d15004SDag-Erling Smørgrav 		ub_event_add_bits(c->ev->ev, UB_EV_TIMEOUT);
4873b7579f77SDag-Erling Smørgrav #ifndef S_SPLINT_S /* splint fails on struct timeval. */
4874b5663de9SDag-Erling Smørgrav 		c->timeout->tv_sec = msec/1000;
4875b5663de9SDag-Erling Smørgrav 		c->timeout->tv_usec = (msec%1000)*1000;
4876b7579f77SDag-Erling Smørgrav #endif /* S_SPLINT_S */
487724e36522SCy Schubert 	} else {
487824e36522SCy Schubert 		if(msec == 0 || !c->timeout) {
487924e36522SCy Schubert 			ub_event_del_bits(c->ev->ev, UB_EV_TIMEOUT);
488024e36522SCy Schubert 		}
4881b7579f77SDag-Erling Smørgrav 	}
488257bddd21SDag-Erling Smørgrav 	if(c->type == comm_tcp || c->type == comm_http) {
4883e2d15004SDag-Erling Smørgrav 		ub_event_del_bits(c->ev->ev, UB_EV_READ|UB_EV_WRITE);
4884369c6923SCy Schubert 		if(c->tcp_write_and_read) {
4885369c6923SCy Schubert 			verbose(5, "startlistening %d mode rw", (newfd==-1?c->fd:newfd));
4886369c6923SCy Schubert 			ub_event_add_bits(c->ev->ev, UB_EV_READ|UB_EV_WRITE);
4887369c6923SCy Schubert 		} else if(c->tcp_is_reading) {
4888369c6923SCy Schubert 			verbose(5, "startlistening %d mode r", (newfd==-1?c->fd:newfd));
4889e2d15004SDag-Erling Smørgrav 			ub_event_add_bits(c->ev->ev, UB_EV_READ);
4890369c6923SCy Schubert 		} else	{
4891369c6923SCy Schubert 			verbose(5, "startlistening %d mode w", (newfd==-1?c->fd:newfd));
4892369c6923SCy Schubert 			ub_event_add_bits(c->ev->ev, UB_EV_WRITE);
4893369c6923SCy Schubert 		}
4894b7579f77SDag-Erling Smørgrav 	}
4895b7579f77SDag-Erling Smørgrav 	if(newfd != -1) {
4896369c6923SCy Schubert 		if(c->fd != -1 && c->fd != newfd) {
4897369c6923SCy Schubert 			verbose(5, "cpsl close of fd %d for %d", c->fd, newfd);
4898c0caa2e2SCy Schubert 			sock_close(c->fd);
4899b7579f77SDag-Erling Smørgrav 		}
4900b7579f77SDag-Erling Smørgrav 		c->fd = newfd;
4901e2d15004SDag-Erling Smørgrav 		ub_event_set_fd(c->ev->ev, c->fd);
4902b7579f77SDag-Erling Smørgrav 	}
4903b5663de9SDag-Erling Smørgrav 	if(ub_event_add(c->ev->ev, msec==0?NULL:c->timeout) != 0) {
4904b7579f77SDag-Erling Smørgrav 		log_err("event_add failed. in cpsl.");
490524e36522SCy Schubert 		return;
4906b7579f77SDag-Erling Smørgrav 	}
4907f44e67d1SCy Schubert 	c->event_added = 1;
4908b7579f77SDag-Erling Smørgrav }
4909b7579f77SDag-Erling Smørgrav 
4910b7579f77SDag-Erling Smørgrav void comm_point_listen_for_rw(struct comm_point* c, int rd, int wr)
4911b7579f77SDag-Erling Smørgrav {
4912b7579f77SDag-Erling Smørgrav 	verbose(VERB_ALGO, "comm point listen_for_rw %d %d", c->fd, wr);
4913f44e67d1SCy Schubert 	if(c->event_added) {
4914e2d15004SDag-Erling Smørgrav 		if(ub_event_del(c->ev->ev) != 0) {
4915b7579f77SDag-Erling Smørgrav 			log_err("event_del error to cplf");
4916b7579f77SDag-Erling Smørgrav 		}
4917f44e67d1SCy Schubert 		c->event_added = 0;
4918f44e67d1SCy Schubert 	}
491924e36522SCy Schubert 	if(!c->timeout) {
492024e36522SCy Schubert 		ub_event_del_bits(c->ev->ev, UB_EV_TIMEOUT);
492124e36522SCy Schubert 	}
4922e2d15004SDag-Erling Smørgrav 	ub_event_del_bits(c->ev->ev, UB_EV_READ|UB_EV_WRITE);
4923e2d15004SDag-Erling Smørgrav 	if(rd) ub_event_add_bits(c->ev->ev, UB_EV_READ);
4924e2d15004SDag-Erling Smørgrav 	if(wr) ub_event_add_bits(c->ev->ev, UB_EV_WRITE);
4925e2d15004SDag-Erling Smørgrav 	if(ub_event_add(c->ev->ev, c->timeout) != 0) {
4926b7579f77SDag-Erling Smørgrav 		log_err("event_add failed. in cplf.");
492724e36522SCy Schubert 		return;
4928b7579f77SDag-Erling Smørgrav 	}
4929f44e67d1SCy Schubert 	c->event_added = 1;
4930b7579f77SDag-Erling Smørgrav }
4931b7579f77SDag-Erling Smørgrav 
4932b7579f77SDag-Erling Smørgrav size_t comm_point_get_mem(struct comm_point* c)
4933b7579f77SDag-Erling Smørgrav {
4934b7579f77SDag-Erling Smørgrav 	size_t s;
4935b7579f77SDag-Erling Smørgrav 	if(!c)
4936b7579f77SDag-Erling Smørgrav 		return 0;
4937b7579f77SDag-Erling Smørgrav 	s = sizeof(*c) + sizeof(*c->ev);
4938b7579f77SDag-Erling Smørgrav 	if(c->timeout)
4939b7579f77SDag-Erling Smørgrav 		s += sizeof(*c->timeout);
494065b390aaSDag-Erling Smørgrav 	if(c->type == comm_tcp || c->type == comm_local) {
494117d15b25SDag-Erling Smørgrav 		s += sizeof(*c->buffer) + sldns_buffer_capacity(c->buffer);
494265b390aaSDag-Erling Smørgrav #ifdef USE_DNSCRYPT
494365b390aaSDag-Erling Smørgrav 		s += sizeof(*c->dnscrypt_buffer);
494465b390aaSDag-Erling Smørgrav 		if(c->buffer != c->dnscrypt_buffer) {
494565b390aaSDag-Erling Smørgrav 			s += sldns_buffer_capacity(c->dnscrypt_buffer);
494665b390aaSDag-Erling Smørgrav 		}
494765b390aaSDag-Erling Smørgrav #endif
494865b390aaSDag-Erling Smørgrav 	}
4949b7579f77SDag-Erling Smørgrav 	if(c->type == comm_tcp_accept) {
4950b7579f77SDag-Erling Smørgrav 		int i;
4951b7579f77SDag-Erling Smørgrav 		for(i=0; i<c->max_tcp_count; i++)
4952b7579f77SDag-Erling Smørgrav 			s += comm_point_get_mem(c->tcp_handlers[i]);
4953b7579f77SDag-Erling Smørgrav 	}
4954b7579f77SDag-Erling Smørgrav 	return s;
4955b7579f77SDag-Erling Smørgrav }
4956b7579f77SDag-Erling Smørgrav 
4957b7579f77SDag-Erling Smørgrav struct comm_timer*
4958b7579f77SDag-Erling Smørgrav comm_timer_create(struct comm_base* base, void (*cb)(void*), void* cb_arg)
4959b7579f77SDag-Erling Smørgrav {
4960e2d15004SDag-Erling Smørgrav 	struct internal_timer *tm = (struct internal_timer*)calloc(1,
4961b7579f77SDag-Erling Smørgrav 		sizeof(struct internal_timer));
4962e2d15004SDag-Erling Smørgrav 	if(!tm) {
4963b7579f77SDag-Erling Smørgrav 		log_err("malloc failed");
4964b7579f77SDag-Erling Smørgrav 		return NULL;
4965b7579f77SDag-Erling Smørgrav 	}
4966e2d15004SDag-Erling Smørgrav 	tm->super.ev_timer = tm;
4967e2d15004SDag-Erling Smørgrav 	tm->base = base;
4968e2d15004SDag-Erling Smørgrav 	tm->super.callback = cb;
4969e2d15004SDag-Erling Smørgrav 	tm->super.cb_arg = cb_arg;
4970e2d15004SDag-Erling Smørgrav 	tm->ev = ub_event_new(base->eb->base, -1, UB_EV_TIMEOUT,
4971e2d15004SDag-Erling Smørgrav 		comm_timer_callback, &tm->super);
4972e2d15004SDag-Erling Smørgrav 	if(tm->ev == NULL) {
4973b7579f77SDag-Erling Smørgrav 		log_err("timer_create: event_base_set failed.");
4974b7579f77SDag-Erling Smørgrav 		free(tm);
4975b7579f77SDag-Erling Smørgrav 		return NULL;
4976b7579f77SDag-Erling Smørgrav 	}
4977e2d15004SDag-Erling Smørgrav 	return &tm->super;
4978b7579f77SDag-Erling Smørgrav }
4979b7579f77SDag-Erling Smørgrav 
4980b7579f77SDag-Erling Smørgrav void
4981b7579f77SDag-Erling Smørgrav comm_timer_disable(struct comm_timer* timer)
4982b7579f77SDag-Erling Smørgrav {
4983b7579f77SDag-Erling Smørgrav 	if(!timer)
4984b7579f77SDag-Erling Smørgrav 		return;
4985e2d15004SDag-Erling Smørgrav 	ub_timer_del(timer->ev_timer->ev);
4986b7579f77SDag-Erling Smørgrav 	timer->ev_timer->enabled = 0;
4987b7579f77SDag-Erling Smørgrav }
4988b7579f77SDag-Erling Smørgrav 
4989b7579f77SDag-Erling Smørgrav void
4990b7579f77SDag-Erling Smørgrav comm_timer_set(struct comm_timer* timer, struct timeval* tv)
4991b7579f77SDag-Erling Smørgrav {
4992b7579f77SDag-Erling Smørgrav 	log_assert(tv);
4993b7579f77SDag-Erling Smørgrav 	if(timer->ev_timer->enabled)
4994b7579f77SDag-Erling Smørgrav 		comm_timer_disable(timer);
4995e2d15004SDag-Erling Smørgrav 	if(ub_timer_add(timer->ev_timer->ev, timer->ev_timer->base->eb->base,
4996e2d15004SDag-Erling Smørgrav 		comm_timer_callback, timer, tv) != 0)
4997b7579f77SDag-Erling Smørgrav 		log_err("comm_timer_set: evtimer_add failed.");
4998b7579f77SDag-Erling Smørgrav 	timer->ev_timer->enabled = 1;
4999b7579f77SDag-Erling Smørgrav }
5000b7579f77SDag-Erling Smørgrav 
5001b7579f77SDag-Erling Smørgrav void
5002b7579f77SDag-Erling Smørgrav comm_timer_delete(struct comm_timer* timer)
5003b7579f77SDag-Erling Smørgrav {
5004b7579f77SDag-Erling Smørgrav 	if(!timer)
5005b7579f77SDag-Erling Smørgrav 		return;
5006b7579f77SDag-Erling Smørgrav 	comm_timer_disable(timer);
5007e2d15004SDag-Erling Smørgrav 	/* Free the sub struct timer->ev_timer derived from the super struct timer.
5008e2d15004SDag-Erling Smørgrav 	 * i.e. assert(timer == timer->ev_timer)
5009e2d15004SDag-Erling Smørgrav 	 */
5010e2d15004SDag-Erling Smørgrav 	ub_event_free(timer->ev_timer->ev);
5011b7579f77SDag-Erling Smørgrav 	free(timer->ev_timer);
5012b7579f77SDag-Erling Smørgrav }
5013b7579f77SDag-Erling Smørgrav 
5014b7579f77SDag-Erling Smørgrav void
5015b7579f77SDag-Erling Smørgrav comm_timer_callback(int ATTR_UNUSED(fd), short event, void* arg)
5016b7579f77SDag-Erling Smørgrav {
5017b7579f77SDag-Erling Smørgrav 	struct comm_timer* tm = (struct comm_timer*)arg;
5018e2d15004SDag-Erling Smørgrav 	if(!(event&UB_EV_TIMEOUT))
5019b7579f77SDag-Erling Smørgrav 		return;
5020e2d15004SDag-Erling Smørgrav 	ub_comm_base_now(tm->ev_timer->base);
5021b7579f77SDag-Erling Smørgrav 	tm->ev_timer->enabled = 0;
5022b7579f77SDag-Erling Smørgrav 	fptr_ok(fptr_whitelist_comm_timer(tm->callback));
5023b7579f77SDag-Erling Smørgrav 	(*tm->callback)(tm->cb_arg);
5024b7579f77SDag-Erling Smørgrav }
5025b7579f77SDag-Erling Smørgrav 
5026b7579f77SDag-Erling Smørgrav int
5027b7579f77SDag-Erling Smørgrav comm_timer_is_set(struct comm_timer* timer)
5028b7579f77SDag-Erling Smørgrav {
5029b7579f77SDag-Erling Smørgrav 	return (int)timer->ev_timer->enabled;
5030b7579f77SDag-Erling Smørgrav }
5031b7579f77SDag-Erling Smørgrav 
5032b7579f77SDag-Erling Smørgrav size_t
5033e2d15004SDag-Erling Smørgrav comm_timer_get_mem(struct comm_timer* ATTR_UNUSED(timer))
5034b7579f77SDag-Erling Smørgrav {
5035e2d15004SDag-Erling Smørgrav 	return sizeof(struct internal_timer);
5036b7579f77SDag-Erling Smørgrav }
5037b7579f77SDag-Erling Smørgrav 
5038b7579f77SDag-Erling Smørgrav struct comm_signal*
5039b7579f77SDag-Erling Smørgrav comm_signal_create(struct comm_base* base,
5040b7579f77SDag-Erling Smørgrav         void (*callback)(int, void*), void* cb_arg)
5041b7579f77SDag-Erling Smørgrav {
5042b7579f77SDag-Erling Smørgrav 	struct comm_signal* com = (struct comm_signal*)malloc(
5043b7579f77SDag-Erling Smørgrav 		sizeof(struct comm_signal));
5044b7579f77SDag-Erling Smørgrav 	if(!com) {
5045b7579f77SDag-Erling Smørgrav 		log_err("malloc failed");
5046b7579f77SDag-Erling Smørgrav 		return NULL;
5047b7579f77SDag-Erling Smørgrav 	}
5048b7579f77SDag-Erling Smørgrav 	com->base = base;
5049b7579f77SDag-Erling Smørgrav 	com->callback = callback;
5050b7579f77SDag-Erling Smørgrav 	com->cb_arg = cb_arg;
5051b7579f77SDag-Erling Smørgrav 	com->ev_signal = NULL;
5052b7579f77SDag-Erling Smørgrav 	return com;
5053b7579f77SDag-Erling Smørgrav }
5054b7579f77SDag-Erling Smørgrav 
5055b7579f77SDag-Erling Smørgrav void
5056b7579f77SDag-Erling Smørgrav comm_signal_callback(int sig, short event, void* arg)
5057b7579f77SDag-Erling Smørgrav {
5058b7579f77SDag-Erling Smørgrav 	struct comm_signal* comsig = (struct comm_signal*)arg;
5059e2d15004SDag-Erling Smørgrav 	if(!(event & UB_EV_SIGNAL))
5060b7579f77SDag-Erling Smørgrav 		return;
5061e2d15004SDag-Erling Smørgrav 	ub_comm_base_now(comsig->base);
5062b7579f77SDag-Erling Smørgrav 	fptr_ok(fptr_whitelist_comm_signal(comsig->callback));
5063b7579f77SDag-Erling Smørgrav 	(*comsig->callback)(sig, comsig->cb_arg);
5064b7579f77SDag-Erling Smørgrav }
5065b7579f77SDag-Erling Smørgrav 
5066b7579f77SDag-Erling Smørgrav int
5067b7579f77SDag-Erling Smørgrav comm_signal_bind(struct comm_signal* comsig, int sig)
5068b7579f77SDag-Erling Smørgrav {
5069b7579f77SDag-Erling Smørgrav 	struct internal_signal* entry = (struct internal_signal*)calloc(1,
5070b7579f77SDag-Erling Smørgrav 		sizeof(struct internal_signal));
5071b7579f77SDag-Erling Smørgrav 	if(!entry) {
5072b7579f77SDag-Erling Smørgrav 		log_err("malloc failed");
5073b7579f77SDag-Erling Smørgrav 		return 0;
5074b7579f77SDag-Erling Smørgrav 	}
5075b7579f77SDag-Erling Smørgrav 	log_assert(comsig);
5076b7579f77SDag-Erling Smørgrav 	/* add signal event */
5077e2d15004SDag-Erling Smørgrav 	entry->ev = ub_signal_new(comsig->base->eb->base, sig,
5078e2d15004SDag-Erling Smørgrav 		comm_signal_callback, comsig);
5079e2d15004SDag-Erling Smørgrav 	if(entry->ev == NULL) {
5080e2d15004SDag-Erling Smørgrav 		log_err("Could not create signal event");
5081b7579f77SDag-Erling Smørgrav 		free(entry);
5082b7579f77SDag-Erling Smørgrav 		return 0;
5083b7579f77SDag-Erling Smørgrav 	}
5084e2d15004SDag-Erling Smørgrav 	if(ub_signal_add(entry->ev, NULL) != 0) {
5085b7579f77SDag-Erling Smørgrav 		log_err("Could not add signal handler");
5086e2d15004SDag-Erling Smørgrav 		ub_event_free(entry->ev);
5087b7579f77SDag-Erling Smørgrav 		free(entry);
5088b7579f77SDag-Erling Smørgrav 		return 0;
5089b7579f77SDag-Erling Smørgrav 	}
5090b7579f77SDag-Erling Smørgrav 	/* link into list */
5091b7579f77SDag-Erling Smørgrav 	entry->next = comsig->ev_signal;
5092b7579f77SDag-Erling Smørgrav 	comsig->ev_signal = entry;
5093b7579f77SDag-Erling Smørgrav 	return 1;
5094b7579f77SDag-Erling Smørgrav }
5095b7579f77SDag-Erling Smørgrav 
5096b7579f77SDag-Erling Smørgrav void
5097b7579f77SDag-Erling Smørgrav comm_signal_delete(struct comm_signal* comsig)
5098b7579f77SDag-Erling Smørgrav {
5099b7579f77SDag-Erling Smørgrav 	struct internal_signal* p, *np;
5100b7579f77SDag-Erling Smørgrav 	if(!comsig)
5101b7579f77SDag-Erling Smørgrav 		return;
5102b7579f77SDag-Erling Smørgrav 	p=comsig->ev_signal;
5103b7579f77SDag-Erling Smørgrav 	while(p) {
5104b7579f77SDag-Erling Smørgrav 		np = p->next;
5105e2d15004SDag-Erling Smørgrav 		ub_signal_del(p->ev);
5106e2d15004SDag-Erling Smørgrav 		ub_event_free(p->ev);
5107b7579f77SDag-Erling Smørgrav 		free(p);
5108b7579f77SDag-Erling Smørgrav 		p = np;
5109b7579f77SDag-Erling Smørgrav 	}
5110b7579f77SDag-Erling Smørgrav 	free(comsig);
5111b7579f77SDag-Erling Smørgrav }
5112