979ee0
From 9e2b0c4b026f281507d1879da8398841270bc20f Mon Sep 17 00:00:00 2001
979ee0
From: Christian Heimes <cheimes@redhat.com>
979ee0
Date: Fri, 15 Jun 2018 17:03:29 +0200
979ee0
Subject: [PATCH] Sort and shuffle SRV record by priority and weight
979ee0
979ee0
On multiple occasions, SRV query answers were not properly sorted by
979ee0
priority. Records with the same priority weren't randomized and shuffled.
979ee0
This caused FreeIPA to contact the same remote peer instead of
979ee0
distributing the load across all available servers.
979ee0
979ee0
Two new helper functions now take care of SRV queries. sort_prio_weight()
979ee0
sorts SRV and URI records. query_srv() combines SRV lookup with
979ee0
sort_prio_weight().
979ee0
979ee0
Fixes: https://pagure.io/freeipa/issue/7475
979ee0
Signed-off-by: Christian Heimes <cheimes@redhat.com>
979ee0
Reviewed-By: Rob Crittenden <rcritten@redhat.com>
979ee0
---
979ee0
 ipaclient/install/ipadiscovery.py       |   3 +-
979ee0
 ipalib/rpc.py                           |  21 ++---
979ee0
 ipalib/util.py                          |  11 ++-
979ee0
 ipapython/config.py                     |   8 +-
979ee0
 ipapython/dnsutil.py                    |  92 +++++++++++++++++++-
979ee0
 ipaserver/dcerpc.py                     |   4 +-
979ee0
 ipatests/test_ipapython/test_dnsutil.py | 106 ++++++++++++++++++++++++
979ee0
 7 files changed, 217 insertions(+), 28 deletions(-)
979ee0
 create mode 100644 ipatests/test_ipapython/test_dnsutil.py
979ee0
979ee0
diff --git a/ipaclient/install/ipadiscovery.py b/ipaclient/install/ipadiscovery.py
979ee0
index 46e05c971647b4f0fb4e6044ef74aff3e7919632..34142179a9f4957e842769d9d4036d2024130793 100644
979ee0
--- a/ipaclient/install/ipadiscovery.py
979ee0
+++ b/ipaclient/install/ipadiscovery.py
979ee0
@@ -25,6 +25,7 @@ from ipapython.ipa_log_manager import root_logger
979ee0
 from dns import resolver, rdatatype
979ee0
 from dns.exception import DNSException
979ee0
 from ipalib import errors
979ee0
+from ipapython.dnsutil import query_srv
979ee0
 from ipapython import ipaldap
979ee0
 from ipaplatform.paths import paths
979ee0
 from ipapython.ipautil import valid_ip, realm_to_suffix
979ee0
@@ -492,7 +493,7 @@ class IPADiscovery(object):
979ee0
         root_logger.debug("Search DNS for SRV record of %s", qname)
979ee0
 
979ee0
         try:
979ee0
-            answers = resolver.query(qname, rdatatype.SRV)
979ee0
+            answers = query_srv(qname)
979ee0
         except DNSException as e:
979ee0
             root_logger.debug("DNS record not found: %s", e.__class__.__name__)
979ee0
             answers = []
979ee0
diff --git a/ipalib/rpc.py b/ipalib/rpc.py
979ee0
index e3b8d67d69c084ad1a43390b5f93061826a27e1d..e74807d57955cd36aa8622b4441e08ee89cd313e 100644
979ee0
--- a/ipalib/rpc.py
979ee0
+++ b/ipalib/rpc.py
979ee0
@@ -43,7 +43,6 @@ import socket
979ee0
 import gzip
979ee0
 
979ee0
 import gssapi
979ee0
-from dns import resolver, rdatatype
979ee0
 from dns.exception import DNSException
979ee0
 from ssl import SSLError
979ee0
 import six
979ee0
@@ -59,7 +58,7 @@ from ipapython.ipa_log_manager import root_logger
979ee0
 from ipapython import ipautil
979ee0
 from ipapython import session_storage
979ee0
 from ipapython.cookie import Cookie
979ee0
-from ipapython.dnsutil import DNSName
979ee0
+from ipapython.dnsutil import DNSName, query_srv
979ee0
 from ipalib.text import _
979ee0
 from ipalib.util import create_https_connection
979ee0
 from ipalib.krb_utils import KRB5KDC_ERR_S_PRINCIPAL_UNKNOWN, KRB5KRB_AP_ERR_TKT_EXPIRED, \
979ee0
@@ -853,7 +852,7 @@ class RPCClient(Connectible):
979ee0
         name = '_ldap._tcp.%s.' % self.env.domain
979ee0
 
979ee0
         try:
979ee0
-            answers = resolver.query(name, rdatatype.SRV)
979ee0
+            answers = query_srv(name)
979ee0
         except DNSException:
979ee0
             answers = []
979ee0
 
979ee0
@@ -861,17 +860,11 @@ class RPCClient(Connectible):
979ee0
             server = str(answer.target).rstrip(".")
979ee0
             servers.append('https://%s%s' % (ipautil.format_netloc(server), path))
979ee0
 
979ee0
-        servers = list(set(servers))
979ee0
-        # the list/set conversion won't preserve order so stick in the
979ee0
-        # local config file version here.
979ee0
-        cfg_server = rpc_uri
979ee0
-        if cfg_server in servers:
979ee0
-            # make sure the configured master server is there just once and
979ee0
-            # it is the first one
979ee0
-            servers.remove(cfg_server)
979ee0
-            servers.insert(0, cfg_server)
979ee0
-        else:
979ee0
-            servers.insert(0, cfg_server)
979ee0
+        # make sure the configured master server is there just once and
979ee0
+        # it is the first one.
979ee0
+        if rpc_uri in servers:
979ee0
+            servers.remove(rpc_uri)
979ee0
+        servers.insert(0, rpc_uri)
979ee0
 
979ee0
         return servers
979ee0
 
979ee0
diff --git a/ipalib/util.py b/ipalib/util.py
979ee0
index 6ee65498b4de674fe4b2ee361541d3bfe648bba0..56db48638e8319859850fba449ed7c23b6e909ab 100644
979ee0
--- a/ipalib/util.py
979ee0
+++ b/ipalib/util.py
979ee0
@@ -934,14 +934,13 @@ def detect_dns_zone_realm_type(api, domain):
979ee0
 
979ee0
     try:
979ee0
         # The presence of this record is enough, return foreign in such case
979ee0
-        result = resolver.query(ad_specific_record_name, rdatatype.SRV)
979ee0
-        return 'foreign'
979ee0
-
979ee0
+        resolver.query(ad_specific_record_name, rdatatype.SRV)
979ee0
     except DNSException:
979ee0
-        pass
979ee0
+        # If we could not detect type with certainty, return unknown
979ee0
+        return 'unknown'
979ee0
+    else:
979ee0
+        return 'foreign'
979ee0
 
979ee0
-    # If we could not detect type with certainity, return unknown
979ee0
-    return 'unknown'
979ee0
 
979ee0
 def has_managed_topology(api):
979ee0
     domainlevel = api.Command['domainlevel_get']().get('result', DOMAIN_LEVEL_0)
979ee0
diff --git a/ipapython/config.py b/ipapython/config.py
979ee0
index 19abfc51ee354d2971be836fa6bad70eea3a6720..44c823b6b946c28a510e5f156061eba0b05aa059 100644
979ee0
--- a/ipapython/config.py
979ee0
+++ b/ipapython/config.py
979ee0
@@ -24,7 +24,6 @@ from optparse import (
979ee0
 from copy import copy
979ee0
 import socket
979ee0
 
979ee0
-from dns import resolver, rdatatype
979ee0
 from dns.exception import DNSException
979ee0
 import dns.name
979ee0
 # pylint: disable=import-error
979ee0
@@ -33,6 +32,7 @@ from six.moves.urllib.parse import urlsplit
979ee0
 # pylint: enable=import-error
979ee0
 
979ee0
 from ipapython.dn import DN
979ee0
+from ipapython.dnsutil import query_srv
979ee0
 
979ee0
 try:
979ee0
     # pylint: disable=ipa-forbidden-import
979ee0
@@ -195,7 +195,7 @@ def __discover_config(discover_server = True):
979ee0
             name = "_ldap._tcp." + domain
979ee0
 
979ee0
             try:
979ee0
-                servers = resolver.query(name, rdatatype.SRV)
979ee0
+                servers = query_srv(name)
979ee0
             except DNSException:
979ee0
                 # try cycling on domain components of FQDN
979ee0
                 try:
979ee0
@@ -210,7 +210,7 @@ def __discover_config(discover_server = True):
979ee0
                         return False
979ee0
                     name = "_ldap._tcp.%s" % domain
979ee0
                     try:
979ee0
-                        servers = resolver.query(name, rdatatype.SRV)
979ee0
+                        servers = query_srv(name)
979ee0
                         break
979ee0
                     except DNSException:
979ee0
                         pass
979ee0
@@ -221,7 +221,7 @@ def __discover_config(discover_server = True):
979ee0
             if not servers:
979ee0
                 name = "_ldap._tcp.%s." % config.default_domain
979ee0
                 try:
979ee0
-                    servers = resolver.query(name, rdatatype.SRV)
979ee0
+                    servers = query_srv(name)
979ee0
                 except DNSException:
979ee0
                     pass
979ee0
 
979ee0
diff --git a/ipapython/dnsutil.py b/ipapython/dnsutil.py
979ee0
index 011b722dac3e181ac52f7d92d9f44d31c5e2e6bb..25435ba51e6e7c2c6581b60eb077dd133dd29724 100644
979ee0
--- a/ipapython/dnsutil.py
979ee0
+++ b/ipapython/dnsutil.py
979ee0
@@ -17,10 +17,15 @@
979ee0
 # along with this program.  If not, see <http://www.gnu.org/licenses/>.
979ee0
 #
979ee0
 
979ee0
+import copy
979ee0
+import operator
979ee0
+import random
979ee0
+
979ee0
 import dns.name
979ee0
 import dns.exception
979ee0
 import dns.resolver
979ee0
-import copy
979ee0
+import dns.rdataclass
979ee0
+import dns.rdatatype
979ee0
 
979ee0
 import six
979ee0
 
979ee0
@@ -369,3 +374,88 @@ def check_zone_overlap(zone, raise_on_error=True):
979ee0
         if ns:
979ee0
             msg += u" and is handled by server(s): {0}".format(', '.join(ns))
979ee0
         raise ValueError(msg)
979ee0
+
979ee0
+
979ee0
+def _mix_weight(records):
979ee0
+    """Weighted population sorting for records with same priority
979ee0
+    """
979ee0
+    # trivial case
979ee0
+    if len(records) <= 1:
979ee0
+        return records
979ee0
+
979ee0
+    # Optimization for common case: If all weights are the same (e.g. 0),
979ee0
+    # just shuffle the records, which is about four times faster.
979ee0
+    if all(rr.weight == records[0].weight for rr in records):
979ee0
+        random.shuffle(records)
979ee0
+        return records
979ee0
+
979ee0
+    noweight = 0.01  # give records with 0 weight a small chance
979ee0
+    result = []
979ee0
+    records = set(records)
979ee0
+    while len(records) > 1:
979ee0
+        # Compute the sum of the weights of those RRs. Then choose a
979ee0
+        # uniform random number between 0 and the sum computed (inclusive).
979ee0
+        urn = random.uniform(0, sum(rr.weight or noweight for rr in records))
979ee0
+        # Select the RR whose running sum value is the first in the selected
979ee0
+        # order which is greater than or equal to the random number selected.
979ee0
+        acc = 0.
979ee0
+        for rr in records.copy():
979ee0
+            acc += rr.weight or noweight
979ee0
+            if acc >= urn:
979ee0
+                records.remove(rr)
979ee0
+                result.append(rr)
979ee0
+    if records:
979ee0
+        result.append(records.pop())
979ee0
+    return result
979ee0
+
979ee0
+
979ee0
+def sort_prio_weight(records):
979ee0
+    """RFC 2782 sorting algorithm for SRV and URI records
979ee0
+
979ee0
+    RFC 2782 defines a sorting algorithm for SRV records that is also used
979ee0
+    for sorting URI records. Records are sorted by priority and then randomly
979ee0
+    shuffled according to weight.
979ee0
+
979ee0
+    This implementation also removes duplicate entries.
979ee0
+    """
979ee0
+    # order records by priority
979ee0
+    records = sorted(records, key=operator.attrgetter("priority"))
979ee0
+
979ee0
+    # remove duplicate entries
979ee0
+    uniquerecords = []
979ee0
+    seen = set()
979ee0
+    for rr in records:
979ee0
+        # A SRV record has target and port, URI just has target.
979ee0
+        target = (rr.target, getattr(rr, "port", None))
979ee0
+        if target not in seen:
979ee0
+            uniquerecords.append(rr)
979ee0
+            seen.add(target)
979ee0
+
979ee0
+    # weighted randomization of entries with same priority
979ee0
+    result = []
979ee0
+    sameprio = []
979ee0
+    for rr in uniquerecords:
979ee0
+        # add all items with same priority in a bucket
979ee0
+        if not sameprio or sameprio[0].priority == rr.priority:
979ee0
+            sameprio.append(rr)
979ee0
+        else:
979ee0
+            # got different priority, shuffle bucket
979ee0
+            result.extend(_mix_weight(sameprio))
979ee0
+            # start a new priority list
979ee0
+            sameprio = [rr]
979ee0
+    # add last batch of records with same priority
979ee0
+    if sameprio:
979ee0
+        result.extend(_mix_weight(sameprio))
979ee0
+    return result
979ee0
+
979ee0
+
979ee0
+def query_srv(qname, resolver=None, **kwargs):
979ee0
+    """Query SRV records and sort reply according to RFC 2782
979ee0
+
979ee0
+    :param qname: query name, _service._proto.domain.
979ee0
+    :return: list of dns.rdtypes.IN.SRV.SRV instances
979ee0
+    """
979ee0
+    if resolver is None:
979ee0
+        resolver = dns.resolver
979ee0
+    answer = resolver.query(qname, rdtype=dns.rdatatype.SRV, **kwargs)
979ee0
+    return sort_prio_weight(answer)
979ee0
diff --git a/ipaserver/dcerpc.py b/ipaserver/dcerpc.py
979ee0
index ac1b2a34784df491a3851aa21bbadbec2297241c..4e957b19292f51a7f6e3540dc38590737c7ae5e4 100644
979ee0
--- a/ipaserver/dcerpc.py
979ee0
+++ b/ipaserver/dcerpc.py
979ee0
@@ -30,6 +30,7 @@ from ipalib import errors
979ee0
 from ipapython import ipautil
979ee0
 from ipapython.ipa_log_manager import root_logger
979ee0
 from ipapython.dn import DN
979ee0
+from ipapython.dnsutil import query_srv
979ee0
 from ipaserver.install import installutils
979ee0
 from ipaserver.dcerpc_common import (TRUST_BIDIRECTIONAL,
979ee0
                                      TRUST_JOIN_EXTERNAL,
979ee0
@@ -55,7 +56,6 @@ import samba
979ee0
 import ldap as _ldap
979ee0
 from ipapython import ipaldap
979ee0
 from ipapython.dnsutil import DNSName
979ee0
-from dns import resolver, rdatatype
979ee0
 from dns.exception import DNSException
979ee0
 import pysss_nss_idmap
979ee0
 import pysss
979ee0
@@ -795,7 +795,7 @@ class DomainValidator(object):
979ee0
             gc_name = '_gc._tcp.%s.' % info['dns_domain']
979ee0
 
979ee0
             try:
979ee0
-                answers = resolver.query(gc_name, rdatatype.SRV)
979ee0
+                answers = query_srv(gc_name)
979ee0
             except DNSException as e:
979ee0
                 answers = []
979ee0
 
979ee0
diff --git a/ipatests/test_ipapython/test_dnsutil.py b/ipatests/test_ipapython/test_dnsutil.py
979ee0
new file mode 100644
979ee0
index 0000000000000000000000000000000000000000..36adb077cf38f6d036aa1048b201dee7d08eb310
979ee0
--- /dev/null
979ee0
+++ b/ipatests/test_ipapython/test_dnsutil.py
979ee0
@@ -0,0 +1,106 @@
979ee0
+#
979ee0
+# Copyright (C) 2018  FreeIPA Contributors.  See COPYING for license
979ee0
+#
979ee0
+import dns.name
979ee0
+import dns.rdataclass
979ee0
+import dns.rdatatype
979ee0
+from dns.rdtypes.IN.SRV import SRV
979ee0
+from dns.rdtypes.ANY.URI import URI
979ee0
+
979ee0
+from ipapython import dnsutil
979ee0
+
979ee0
+import pytest
979ee0
+
979ee0
+
979ee0
+def mksrv(priority, weight, port, target):
979ee0
+    return SRV(
979ee0
+        rdclass=dns.rdataclass.IN,
979ee0
+        rdtype=dns.rdatatype.SRV,
979ee0
+        priority=priority,
979ee0
+        weight=weight,
979ee0
+        port=port,
979ee0
+        target=dns.name.from_text(target)
979ee0
+    )
979ee0
+
979ee0
+
979ee0
+def mkuri(priority, weight, target):
979ee0
+    return URI(
979ee0
+        rdclass=dns.rdataclass.IN,
979ee0
+        rdtype=dns.rdatatype.URI,
979ee0
+        priority=priority,
979ee0
+        weight=weight,
979ee0
+        target=target
979ee0
+    )
979ee0
+
979ee0
+
979ee0
+class TestSortSRV(object):
979ee0
+    def test_empty(self):
979ee0
+        assert dnsutil.sort_prio_weight([]) == []
979ee0
+
979ee0
+    def test_one(self):
979ee0
+        h1 = mksrv(1, 0, 443, u"host1")
979ee0
+        assert dnsutil.sort_prio_weight([h1]) == [h1]
979ee0
+
979ee0
+        h2 = mksrv(10, 5, 443, u"host2")
979ee0
+        assert dnsutil.sort_prio_weight([h2]) == [h2]
979ee0
+
979ee0
+    def test_prio(self):
979ee0
+        h1 = mksrv(1, 0, 443, u"host1")
979ee0
+        h2 = mksrv(2, 0, 443, u"host2")
979ee0
+        h3 = mksrv(3, 0, 443, u"host3")
979ee0
+        assert dnsutil.sort_prio_weight([h3, h2, h1]) == [h1, h2, h3]
979ee0
+        assert dnsutil.sort_prio_weight([h3, h3, h3]) == [h3]
979ee0
+        assert dnsutil.sort_prio_weight([h2, h2, h1, h1]) == [h1, h2]
979ee0
+
979ee0
+        h380 = mksrv(4, 0, 80, u"host3")
979ee0
+        assert dnsutil.sort_prio_weight([h1, h3, h380]) == [h1, h3, h380]
979ee0
+
979ee0
+        hs = mksrv(-1, 0, 443, u"special")
979ee0
+        assert dnsutil.sort_prio_weight([h1, h2, hs]) == [hs, h1, h2]
979ee0
+
979ee0
+    def assert_permutations(self, answers, permutations):
979ee0
+        seen = set()
979ee0
+        for _unused in range(1000):
979ee0
+            result = tuple(dnsutil.sort_prio_weight(answers))
979ee0
+            assert result in permutations
979ee0
+            seen.add(result)
979ee0
+            if seen == permutations:
979ee0
+                break
979ee0
+        else:
979ee0
+            pytest.fail("sorting didn't exhaust all permutations.")
979ee0
+
979ee0
+    def test_sameprio(self):
979ee0
+        h1 = mksrv(1, 0, 443, u"host1")
979ee0
+        h2 = mksrv(1, 0, 443, u"host2")
979ee0
+        permutations = {
979ee0
+            (h1, h2),
979ee0
+            (h2, h1),
979ee0
+        }
979ee0
+        self.assert_permutations([h1, h2], permutations)
979ee0
+
979ee0
+    def test_weight(self):
979ee0
+        h1 = mksrv(1, 0, 443, u"host1")
979ee0
+        h2_w15 = mksrv(2, 15, 443, u"host2")
979ee0
+        h3_w10 = mksrv(2, 10, 443, u"host3")
979ee0
+
979ee0
+        permutations = {
979ee0
+            (h1, h2_w15, h3_w10),
979ee0
+            (h1, h3_w10, h2_w15),
979ee0
+        }
979ee0
+        self.assert_permutations([h1, h2_w15, h3_w10], permutations)
979ee0
+
979ee0
+    def test_large(self):
979ee0
+        records = tuple(
979ee0
+            mksrv(1, i, 443, "host{}".format(i)) for i in range(1000)
979ee0
+        )
979ee0
+        assert len(dnsutil.sort_prio_weight(records)) == len(records)
979ee0
+
979ee0
+
979ee0
+class TestSortURI(object):
979ee0
+    def test_prio(self):
979ee0
+        h1 = mkuri(1, 0, u"https://host1/api")
979ee0
+        h2 = mkuri(2, 0, u"https://host2/api")
979ee0
+        h3 = mkuri(3, 0, u"https://host3/api")
979ee0
+        assert dnsutil.sort_prio_weight([h3, h2, h1]) == [h1, h2, h3]
979ee0
+        assert dnsutil.sort_prio_weight([h3, h3, h3]) == [h3]
979ee0
+        assert dnsutil.sort_prio_weight([h2, h2, h1, h1]) == [h1, h2]
979ee0
-- 
979ee0
2.17.1
979ee0