272df6
From f34cc4f62cd6730fc315ace47b9ae90a82a07ec0 Mon Sep 17 00:00:00 2001
272df6
From: Mark Andrews <marka@isc.org>
272df6
Date: Thu, 4 Sep 2014 10:37:45 +1000
272df6
Subject: [PATCH] 3939. [func] Improve UPDATE forwarding performance by
272df6
 allowing TCP connections to be shared. [RT #37039]
272df6
272df6
(cherry picked from commit 74717eef53ba5d6aefc80eb262bbb090ff4bb3b5)
272df6
---
272df6
 lib/dns/dispatch.c             | 112 ++++++++++++++++++++++++++++++++-
272df6
 lib/dns/include/dns/dispatch.h |  15 +++++
272df6
 lib/dns/request.c              |  46 ++++++++++----
272df6
 lib/dns/win32/libdns.def       |   2 +
272df6
 4 files changed, 159 insertions(+), 16 deletions(-)
272df6
272df6
diff --git a/lib/dns/dispatch.c b/lib/dns/dispatch.c
272df6
index c93651d..ee82241 100644
272df6
--- a/lib/dns/dispatch.c
272df6
+++ b/lib/dns/dispatch.c
272df6
@@ -228,6 +228,7 @@ struct dns_dispatch {
272df6
 	isc_socket_t	       *socket;		/*%< isc socket attached to */
272df6
 	isc_sockaddr_t		local;		/*%< local address */
272df6
 	in_port_t		localport;	/*%< local UDP port */
272df6
+	isc_sockaddr_t		peer;		/*%< peer address (TCP) */
272df6
 	unsigned int		maxrequests;	/*%< max requests */
272df6
 	isc_event_t	       *ctlevent;
272df6
 
272df6
@@ -2327,7 +2328,6 @@ dns_dispatchmgr_destroy(dns_dispatchmgr_t **mgrp) {
272df6
 
272df6
 	LOCK(&mgr->lock);
272df6
 	mgr->state |= MGR_SHUTTINGDOWN;
272df6
-
272df6
 	killit = destroy_mgr_ok(mgr);
272df6
 	UNLOCK(&mgr->lock);
272df6
 
272df6
@@ -2601,6 +2601,7 @@ dispatch_allocate(dns_dispatchmgr_t *mgr, unsigned int maxrequests,
272df6
 	disp->refcount = 1;
272df6
 	disp->recv_pending = 0;
272df6
 	memset(&disp->local, 0, sizeof(disp->local));
272df6
+	memset(&disp->peer, 0, sizeof(disp->peer));
272df6
 	disp->localport = 0;
272df6
 	disp->shutting_down = 0;
272df6
 	disp->shutdown_out = 0;
272df6
@@ -2702,6 +2703,23 @@ dns_dispatch_createtcp(dns_dispatchmgr_t *mgr, isc_socket_t *sock,
272df6
 		       unsigned int buckets, unsigned int increment,
272df6
 		       unsigned int attributes, dns_dispatch_t **dispp)
272df6
 {
272df6
+
272df6
+	attributes |= DNS_DISPATCHATTR_PRIVATE;  /* XXXMLG */
272df6
+
272df6
+	return (dns_dispatch_createtcp2(mgr, sock, taskmgr, NULL, NULL,
272df6
+					buffersize, maxbuffers, maxrequests,
272df6
+					buckets, increment, attributes,
272df6
+					dispp));
272df6
+}
272df6
+
272df6
+isc_result_t
272df6
+dns_dispatch_createtcp2(dns_dispatchmgr_t *mgr, isc_socket_t *sock,
272df6
+		        isc_taskmgr_t *taskmgr, isc_sockaddr_t *localaddr,
272df6
+			isc_sockaddr_t *destaddr, unsigned int buffersize,
272df6
+		        unsigned int maxbuffers, unsigned int maxrequests,
272df6
+		        unsigned int buckets, unsigned int increment,
272df6
+		        unsigned int attributes, dns_dispatch_t **dispp)
272df6
+{
272df6
 	isc_result_t result;
272df6
 	dns_dispatch_t *disp;
272df6
 
272df6
@@ -2713,7 +2731,8 @@ dns_dispatch_createtcp(dns_dispatchmgr_t *mgr, isc_socket_t *sock,
272df6
 	REQUIRE((attributes & DNS_DISPATCHATTR_TCP) != 0);
272df6
 	REQUIRE((attributes & DNS_DISPATCHATTR_UDP) == 0);
272df6
 
272df6
-	attributes |= DNS_DISPATCHATTR_PRIVATE;  /* XXXMLG */
272df6
+	if (destaddr == NULL)
272df6
+		attributes |= DNS_DISPATCHATTR_PRIVATE;  /* XXXMLG */
272df6
 
272df6
 	LOCK(&mgr->lock);
272df6
 
272df6
@@ -2760,6 +2779,23 @@ dns_dispatch_createtcp(dns_dispatchmgr_t *mgr, isc_socket_t *sock,
272df6
 
272df6
 	disp->attributes = attributes;
272df6
 
272df6
+	if (localaddr == NULL) {
272df6
+		if (destaddr != NULL) {
272df6
+			switch (isc_sockaddr_pf(destaddr)) {
272df6
+			case AF_INET:
272df6
+				isc_sockaddr_any(&disp->local);
272df6
+				break;
272df6
+			case AF_INET6:
272df6
+				isc_sockaddr_any6(&disp->local);
272df6
+				break;
272df6
+			}
272df6
+		}
272df6
+	} else
272df6
+		disp->local = *localaddr;
272df6
+
272df6
+	if (destaddr != NULL)
272df6
+		disp->peer = *destaddr;
272df6
+
272df6
 	/*
272df6
 	 * Append it to the dispatcher list.
272df6
 	 */
272df6
@@ -2768,7 +2804,6 @@ dns_dispatch_createtcp(dns_dispatchmgr_t *mgr, isc_socket_t *sock,
272df6
 
272df6
 	mgr_log(mgr, LVL(90), "created TCP dispatcher %p", disp);
272df6
 	dispatch_log(disp, LVL(90), "created task %p", disp->task[0]);
272df6
-
272df6
 	*dispp = disp;
272df6
 
272df6
 	return (ISC_R_SUCCESS);
272df6
@@ -2788,6 +2823,77 @@ dns_dispatch_createtcp(dns_dispatchmgr_t *mgr, isc_socket_t *sock,
272df6
 	return (result);
272df6
 }
272df6
 
272df6
+isc_result_t
272df6
+dns_dispatch_gettcp(dns_dispatchmgr_t *mgr, isc_sockaddr_t *destaddr,
272df6
+		    isc_sockaddr_t *localaddr, dns_dispatch_t **dispp)
272df6
+{
272df6
+#ifdef BIND9
272df6
+	dns_dispatch_t *disp;
272df6
+	isc_result_t result;
272df6
+	isc_sockaddr_t peeraddr;
272df6
+	isc_sockaddr_t sockname;
272df6
+	isc_sockaddr_t any;
272df6
+	unsigned int attributes, mask;
272df6
+	isc_boolean_t match = ISC_FALSE;
272df6
+
272df6
+	REQUIRE(VALID_DISPATCHMGR(mgr));
272df6
+	REQUIRE(destaddr != NULL);
272df6
+	REQUIRE(dispp != NULL && *dispp == NULL);
272df6
+
272df6
+	attributes = DNS_DISPATCHATTR_TCP;
272df6
+	mask = DNS_DISPATCHATTR_TCP | DNS_DISPATCHATTR_PRIVATE |
272df6
+	       DNS_DISPATCHATTR_EXCLUSIVE;
272df6
+
272df6
+	if (localaddr == NULL) {
272df6
+		switch (isc_sockaddr_pf(destaddr)) {
272df6
+		case AF_INET:
272df6
+			isc_sockaddr_any(&any;;
272df6
+			break;
272df6
+		case AF_INET6:
272df6
+			isc_sockaddr_any6(&any;;
272df6
+			break;
272df6
+		default:
272df6
+			return (ISC_R_NOTFOUND);
272df6
+		}
272df6
+		localaddr = &any;
272df6
+	}
272df6
+
272df6
+	LOCK(&mgr->lock);
272df6
+	disp = ISC_LIST_HEAD(mgr->list);
272df6
+	while (disp != NULL && !match) {
272df6
+		LOCK(&disp->lock);
272df6
+		if ((disp->shutting_down == 0) &&
272df6
+		    ATTRMATCH(disp->attributes, attributes, mask) &&
272df6
+		    (localaddr == NULL ||
272df6
+		     isc_sockaddr_eqaddr(localaddr, &disp->local))) {
272df6
+			result = isc_socket_getsockname(disp->socket,
272df6
+							&sockname);
272df6
+			if (result == ISC_R_SUCCESS)
272df6
+				result = isc_socket_getpeername(disp->socket,
272df6
+								&peeraddr);
272df6
+			if (result == ISC_R_SUCCESS &&
272df6
+			    isc_sockaddr_equal(destaddr, &peeraddr) &&
272df6
+			    isc_sockaddr_eqaddr(localaddr, &sockname)) {
272df6
+				/* attach */
272df6
+				disp->refcount++;
272df6
+				*dispp = disp;
272df6
+				match = ISC_TRUE;
272df6
+			}
272df6
+		}
272df6
+		UNLOCK(&disp->lock);
272df6
+		disp = ISC_LIST_NEXT(disp, link);
272df6
+	}
272df6
+	UNLOCK(&mgr->lock);
272df6
+	return (match ? ISC_R_SUCCESS : ISC_R_NOTFOUND);
272df6
+#else
272df6
+	UNUSED(mgr);
272df6
+	UNUSED(destaddr);
272df6
+	UNUSED(localaddr);
272df6
+	UNUSED(dispp);
272df6
+	return ISC_R_NOTIMPLEMENTED;
272df6
+#endif
272df6
+}
272df6
+
272df6
 isc_result_t
272df6
 dns_dispatch_getudp_dup(dns_dispatchmgr_t *mgr, isc_socketmgr_t *sockmgr,
272df6
 		    isc_taskmgr_t *taskmgr, isc_sockaddr_t *localaddr,
272df6
diff --git a/lib/dns/include/dns/dispatch.h b/lib/dns/include/dns/dispatch.h
272df6
index 1235f7c..be9cd66 100644
272df6
--- a/lib/dns/include/dns/dispatch.h
272df6
+++ b/lib/dns/include/dns/dispatch.h
272df6
@@ -298,6 +298,13 @@ dns_dispatch_createtcp(dns_dispatchmgr_t *mgr, isc_socket_t *sock,
272df6
 		       unsigned int maxbuffers, unsigned int maxrequests,
272df6
 		       unsigned int buckets, unsigned int increment,
272df6
 		       unsigned int attributes, dns_dispatch_t **dispp);
272df6
+isc_result_t
272df6
+dns_dispatch_createtcp2(dns_dispatchmgr_t *mgr, isc_socket_t *sock,
272df6
+                        isc_taskmgr_t *taskmgr, isc_sockaddr_t *localaddr,
272df6
+                        isc_sockaddr_t *destaddr, unsigned int buffersize,
272df6
+                        unsigned int maxbuffers, unsigned int maxrequests,
272df6
+                        unsigned int buckets, unsigned int increment,
272df6
+                        unsigned int attributes, dns_dispatch_t **dispp);
272df6
 /*%<
272df6
  * Create a new dns_dispatch and attach it to the provided isc_socket_t.
272df6
  *
272df6
@@ -369,6 +376,14 @@ dns_dispatch_starttcp(dns_dispatch_t *disp);
272df6
  *\li	'disp' is valid.
272df6
  */
272df6
 
272df6
+isc_result_t
272df6
+dns_dispatch_gettcp(dns_dispatchmgr_t *mgr, isc_sockaddr_t *destaddr,
272df6
+                    isc_sockaddr_t *localaddr, dns_dispatch_t **dispp);
272df6
+/*
272df6
+ * Attempt to connect to a existing TCP connection.
272df6
+ */
272df6
+
272df6
+
272df6
 isc_result_t
272df6
 dns_dispatch_addresponse2(dns_dispatch_t *disp, isc_sockaddr_t *dest,
272df6
 			  isc_task_t *task, isc_taskaction_t action, void *arg,
272df6
diff --git a/lib/dns/request.c b/lib/dns/request.c
272df6
index 5c76f9a..9fb6f44 100644
272df6
--- a/lib/dns/request.c
272df6
+++ b/lib/dns/request.c
272df6
@@ -510,7 +510,8 @@ isblackholed(dns_dispatchmgr_t *dispatchmgr, isc_sockaddr_t *destaddr) {
272df6
 
272df6
 static isc_result_t
272df6
 create_tcp_dispatch(dns_requestmgr_t *requestmgr, isc_sockaddr_t *srcaddr,
272df6
-		    isc_sockaddr_t *destaddr, dns_dispatch_t **dispatchp)
272df6
+		    isc_sockaddr_t *destaddr, isc_boolean_t *connected,
272df6
+		    dns_dispatch_t **dispatchp)
272df6
 {
272df6
 	isc_result_t result;
272df6
 	isc_socket_t *socket = NULL;
272df6
@@ -518,6 +519,20 @@ create_tcp_dispatch(dns_requestmgr_t *requestmgr, isc_sockaddr_t *srcaddr,
272df6
 	unsigned int attrs;
272df6
 	isc_sockaddr_t bind_any;
272df6
 
272df6
+	*connected = ISC_FALSE;
272df6
+#ifdef BIND9
272df6
+	result = dns_dispatch_gettcp(requestmgr->dispatchmgr, destaddr,
272df6
+				     srcaddr, dispatchp);
272df6
+	if (result == ISC_R_SUCCESS) {
272df6
+		*connected = ISC_TRUE;
272df6
+		char peer[ISC_SOCKADDR_FORMATSIZE];
272df6
+		isc_sockaddr_format(destaddr, peer, sizeof(peer));
272df6
+		req_log(ISC_LOG_DEBUG(1), "attached to existing TCP "
272df6
+			"connection to %s", peer);
272df6
+		return (result);
272df6
+	}
272df6
+#endif
272df6
+
272df6
 	result = isc_socket_create(requestmgr->socketmgr,
272df6
 				   isc_sockaddr_pf(destaddr),
272df6
 				   isc_sockettype_tcp, &socket);
272df6
@@ -538,16 +553,16 @@ create_tcp_dispatch(dns_requestmgr_t *requestmgr, isc_sockaddr_t *srcaddr,
272df6
 #endif
272df6
 	attrs = 0;
272df6
 	attrs |= DNS_DISPATCHATTR_TCP;
272df6
-	attrs |= DNS_DISPATCHATTR_PRIVATE;
272df6
 	if (isc_sockaddr_pf(destaddr) == AF_INET)
272df6
 		attrs |= DNS_DISPATCHATTR_IPV4;
272df6
 	else
272df6
 		attrs |= DNS_DISPATCHATTR_IPV6;
272df6
 	attrs |= DNS_DISPATCHATTR_MAKEQUERY;
272df6
-	result = dns_dispatch_createtcp(requestmgr->dispatchmgr,
272df6
-					socket, requestmgr->taskmgr,
272df6
-					4096, 2, 1, 1, 3, attrs,
272df6
-					dispatchp);
272df6
+	result = dns_dispatch_createtcp2(requestmgr->dispatchmgr,
272df6
+					 socket, requestmgr->taskmgr,
272df6
+					 srcaddr, destaddr,
272df6
+					 4096, 32768, 32768, 16411, 16433,
272df6
+					 attrs, dispatchp);
272df6
 cleanup:
272df6
 	isc_socket_detach(&socket);
272df6
 	return (result);
272df6
@@ -609,12 +624,15 @@ find_udp_dispatch(dns_requestmgr_t *requestmgr, isc_sockaddr_t *srcaddr,
272df6
 static isc_result_t
272df6
 get_dispatch(isc_boolean_t tcp, dns_requestmgr_t *requestmgr,
272df6
 	     isc_sockaddr_t *srcaddr, isc_sockaddr_t *destaddr,
272df6
+	     isc_boolean_t *connected,
272df6
 	     dns_dispatch_t **dispatchp)
272df6
 {
272df6
 	isc_result_t result;
272df6
+
272df6
 	if (tcp)
272df6
 		result = create_tcp_dispatch(requestmgr, srcaddr,
272df6
-					     destaddr, dispatchp);
272df6
+					     destaddr, connected,
272df6
+					     dispatchp);
272df6
 	else
272df6
 		result = find_udp_dispatch(requestmgr, srcaddr,
272df6
 					   destaddr, dispatchp);
272df6
@@ -686,6 +704,7 @@ dns_request_createraw3(dns_requestmgr_t *requestmgr, isc_buffer_t *msgbuf,
272df6
 	dns_messageid_t	id;
272df6
 	isc_boolean_t tcp = ISC_FALSE;
272df6
 	isc_region_t r;
272df6
+	isc_boolean_t connected = ISC_FALSE;
272df6
 
272df6
 	REQUIRE(VALID_REQUESTMGR(requestmgr));
272df6
 	REQUIRE(msgbuf != NULL);
272df6
@@ -747,7 +766,7 @@ dns_request_createraw3(dns_requestmgr_t *requestmgr, isc_buffer_t *msgbuf,
272df6
 		tcp = ISC_TRUE;
272df6
 
272df6
 	result = get_dispatch(tcp, requestmgr, srcaddr, destaddr,
272df6
-			      &request->dispatch);
272df6
+			      &connected, &request->dispatch);
272df6
 	if (result != ISC_R_SUCCESS)
272df6
 		goto cleanup;
272df6
 
272df6
@@ -794,14 +813,14 @@ dns_request_createraw3(dns_requestmgr_t *requestmgr, isc_buffer_t *msgbuf,
272df6
 		goto unlink;
272df6
 
272df6
 	request->destaddr = *destaddr;
272df6
-	if (tcp) {
272df6
+	if (tcp && !connected) {
272df6
 		result = isc_socket_connect(socket, destaddr, task,
272df6
 					    req_connected, request);
272df6
 		if (result != ISC_R_SUCCESS)
272df6
 			goto unlink;
272df6
 		request->flags |= DNS_REQUEST_F_CONNECTING|DNS_REQUEST_F_TCP;
272df6
 	} else {
272df6
-		result = req_send(request, task, destaddr);
272df6
+		result = req_send(request, task, connected ? NULL : destaddr);
272df6
 		if (result != ISC_R_SUCCESS)
272df6
 			goto unlink;
272df6
 	}
272df6
@@ -886,6 +905,7 @@ dns_request_createvia3(dns_requestmgr_t *requestmgr, dns_message_t *message,
272df6
 	dns_messageid_t	id;
272df6
 	isc_boolean_t tcp;
272df6
 	isc_boolean_t setkey = ISC_TRUE;
272df6
+	isc_boolean_t connected = ISC_FALSE;
272df6
 
272df6
 	REQUIRE(VALID_REQUESTMGR(requestmgr));
272df6
 	REQUIRE(message != NULL);
272df6
@@ -944,7 +964,7 @@ dns_request_createvia3(dns_requestmgr_t *requestmgr, dns_message_t *message,
272df6
  use_tcp:
272df6
 	tcp = ISC_TF((options & DNS_REQUESTOPT_TCP) != 0);
272df6
 	result = get_dispatch(tcp, requestmgr, srcaddr, destaddr,
272df6
-			      &request->dispatch);
272df6
+			      &connected, &request->dispatch);
272df6
 	if (result != ISC_R_SUCCESS)
272df6
 		goto cleanup;
272df6
 
272df6
@@ -1000,14 +1020,14 @@ dns_request_createvia3(dns_requestmgr_t *requestmgr, dns_message_t *message,
272df6
 		goto unlink;
272df6
 
272df6
 	request->destaddr = *destaddr;
272df6
-	if (tcp) {
272df6
+	if (tcp && !connected) {
272df6
 		result = isc_socket_connect(socket, destaddr, task,
272df6
 					    req_connected, request);
272df6
 		if (result != ISC_R_SUCCESS)
272df6
 			goto unlink;
272df6
 		request->flags |= DNS_REQUEST_F_CONNECTING|DNS_REQUEST_F_TCP;
272df6
 	} else {
272df6
-		result = req_send(request, task, destaddr);
272df6
+		result = req_send(request, task, connected ? NULL : destaddr);
272df6
 		if (result != ISC_R_SUCCESS)
272df6
 			goto unlink;
272df6
 	}
272df6
diff --git a/lib/dns/win32/libdns.def b/lib/dns/win32/libdns.def
272df6
index 5e20491..9aebe16 100644
272df6
--- a/lib/dns/win32/libdns.def
272df6
+++ b/lib/dns/win32/libdns.def
272df6
@@ -176,9 +176,11 @@ dns_dispatch_attach
272df6
 dns_dispatch_cancel
272df6
 dns_dispatch_changeattributes
272df6
 dns_dispatch_createtcp
272df6
+dns_dispatch_createtcp2
272df6
 dns_dispatch_detach
272df6
 dns_dispatch_getlocaladdress
272df6
 dns_dispatch_getsocket
272df6
+dns_dispatch_gettcp
272df6
 dns_dispatch_getudp
272df6
 dns_dispatch_getudp_dup
272df6
 dns_dispatch_importrecv
272df6
-- 
272df6
2.20.1
272df6