Blame SOURCES/squid-4.11-large-acl.patch

c00279
diff --git a/src/acl/RegexData.cc b/src/acl/RegexData.cc
c00279
index 01a4c12..b5c1679 100644
c00279
--- a/src/acl/RegexData.cc
c00279
+++ b/src/acl/RegexData.cc
c00279
@@ -22,6 +22,7 @@
c00279
 #include "ConfigParser.h"
c00279
 #include "Debug.h"
c00279
 #include "sbuf/List.h"
c00279
+#include "sbuf/Algorithms.h"
c00279
 
c00279
 ACLRegexData::~ACLRegexData()
c00279
 {
c00279
@@ -129,6 +130,18 @@ compileRE(std::list<RegexPattern> &curlist, const char * RE, int flags)
c00279
     return true;
c00279
 }
c00279
 
c00279
+static bool
c00279
+compileRE(std::list<RegexPattern> &curlist, const SBufList &RE, int flags)
c00279
+{
c00279
+	if (RE.empty())
c00279
+		return curlist.empty(); // XXX: old code did this. It looks wrong.
c00279
+	SBuf regexp;
c00279
+	static const SBuf openparen("("), closeparen(")"), separator(")|(");
c00279
+	JoinContainerIntoSBuf(regexp, RE.begin(), RE.end(), separator, openparen,
c00279
+			closeparen);
c00279
+	return compileRE(curlist, regexp.c_str(), flags);
c00279
+}
c00279
+
c00279
 /** Compose and compile one large RE from a set of (small) REs.
c00279
  * The ultimate goal is to have only one RE per ACL so that match() is
c00279
  * called only once per ACL.
c00279
@@ -137,16 +150,11 @@ static int
c00279
 compileOptimisedREs(std::list<RegexPattern> &curlist, const SBufList &sl)
c00279
 {
c00279
     std::list<RegexPattern> newlist;
c00279
-    int numREs = 0;
c00279
+    SBufList accumulatedRE;
c00279
+    int numREs = 0, reSize = 0;
c00279
     int flags = REG_EXTENDED | REG_NOSUB;
c00279
-    int largeREindex = 0;
c00279
-    char largeRE[BUFSIZ];
c00279
-    *largeRE = 0;
c00279
 
c00279
     for (const SBuf & configurationLineWord : sl) {
c00279
-        int RElen;
c00279
-        RElen = configurationLineWord.length();
c00279
-
c00279
         static const SBuf minus_i("-i");
c00279
         static const SBuf plus_i("+i");
c00279
         if (configurationLineWord == minus_i) {
c00279
@@ -155,10 +163,11 @@ compileOptimisedREs(std::list<RegexPattern> &curlist, const SBufList &sl)
c00279
                 debugs(28, 2, "optimisation of -i ... -i" );
c00279
             } else {
c00279
                 debugs(28, 2, "-i" );
c00279
-                if (!compileRE(newlist, largeRE, flags))
c00279
+                if (!compileRE(newlist, accumulatedRE, flags))
c00279
                     return 0;
c00279
                 flags |= REG_ICASE;
c00279
-                largeRE[largeREindex=0] = '\0';
c00279
+                accumulatedRE.clear();
c00279
+                reSize = 0;
c00279
             }
c00279
         } else if (configurationLineWord == plus_i) {
c00279
             if ((flags & REG_ICASE) == 0) {
c00279
@@ -166,37 +175,34 @@ compileOptimisedREs(std::list<RegexPattern> &curlist, const SBufList &sl)
c00279
                 debugs(28, 2, "optimisation of +i ... +i");
c00279
             } else {
c00279
                 debugs(28, 2, "+i");
c00279
-                if (!compileRE(newlist, largeRE, flags))
c00279
+                if (!compileRE(newlist, accumulatedRE, flags))
c00279
                     return 0;
c00279
                 flags &= ~REG_ICASE;
c00279
-                largeRE[largeREindex=0] = '\0';
c00279
+                accumulatedRE.clear();
c00279
+                reSize = 0;
c00279
             }
c00279
-        } else if (RElen + largeREindex + 3 < BUFSIZ-1) {
c00279
+        } else if (reSize < 1024) {
c00279
             debugs(28, 2, "adding RE '" << configurationLineWord << "'");
c00279
-            if (largeREindex > 0) {
c00279
-                largeRE[largeREindex] = '|';
c00279
-                ++largeREindex;
c00279
-            }
c00279
-            largeRE[largeREindex] = '(';
c00279
-            ++largeREindex;
c00279
-            configurationLineWord.copy(largeRE+largeREindex, BUFSIZ-largeREindex);
c00279
-            largeREindex += configurationLineWord.length();
c00279
-            largeRE[largeREindex] = ')';
c00279
-            ++largeREindex;
c00279
-            largeRE[largeREindex] = '\0';
c00279
+            accumulatedRE.push_back(configurationLineWord);
c00279
             ++numREs;
c00279
+            reSize += configurationLineWord.length();
c00279
         } else {
c00279
             debugs(28, 2, "buffer full, generating new optimised RE..." );
c00279
-            if (!compileRE(newlist, largeRE, flags))
c00279
+            accumulatedRE.push_back(configurationLineWord);
c00279
+            if (!compileRE(newlist, accumulatedRE, flags))
c00279
                 return 0;
c00279
-            largeRE[largeREindex=0] = '\0';
c00279
+            accumulatedRE.clear();
c00279
+            reSize = 0;
c00279
             continue;    /* do the loop again to add the RE to largeRE */
c00279
         }
c00279
     }
c00279
 
c00279
-    if (!compileRE(newlist, largeRE, flags))
c00279
+    if (!compileRE(newlist, accumulatedRE, flags))
c00279
         return 0;
c00279
 
c00279
+    accumulatedRE.clear();
c00279
+    reSize = 0;
c00279
+
c00279
     /* all was successful, so put the new list at the tail */
c00279
     curlist.splice(curlist.end(), newlist);
c00279
 
c00279
diff --git a/src/sbuf/Algorithms.h b/src/sbuf/Algorithms.h
c00279
index 21ee889..338e9c0 100644
c00279
--- a/src/sbuf/Algorithms.h
c00279
+++ b/src/sbuf/Algorithms.h
c00279
@@ -81,6 +81,57 @@ SBufContainerJoin(const Container &items, const SBuf& separator)
c00279
     return rv;
c00279
 }
c00279
 
c00279
+/** Join container of SBufs and append to supplied target
c00279
+ *
c00279
+ * append to the target SBuf all elements in the [begin,end) range from
c00279
+ * an iterable container, prefixed by prefix, separated by separator and
c00279
+ * followed by suffix. Prefix and suffix are added also in case of empty
c00279
+ * iterable
c00279
+ *
c00279
+ * \return the modified dest
c00279
+ */
c00279
+template <class ContainerIterator>
c00279
+SBuf&
c00279
+JoinContainerIntoSBuf(SBuf &dest, const ContainerIterator &begin,
c00279
+                      const ContainerIterator &end, const SBuf& separator,
c00279
+                      const SBuf& prefix = SBuf(), const SBuf& suffix = SBuf())
c00279
+{
c00279
+    if (begin == end) {
c00279
+        dest.append(prefix).append(suffix);
c00279
+        return dest;
c00279
+    }
c00279
+
c00279
+    // optimization: pre-calculate needed storage
c00279
+    const SBuf::size_type totalContainerSize =
c00279
+        std::accumulate(begin, end, 0, SBufAddLength(separator)) +
c00279
+        dest.length() + prefix.length() + suffix.length();
c00279
+    SBufReservationRequirements req;
c00279
+    req.minSpace = totalContainerSize;
c00279
+    dest.reserve(req);
c00279
+
c00279
+    auto i = begin;
c00279
+    dest.append(prefix);
c00279
+    dest.append(*i);
c00279
+    ++i;
c00279
+    for (; i != end; ++i)
c00279
+        dest.append(separator).append(*i);
c00279
+    dest.append(suffix);
c00279
+    return dest;
c00279
+}
c00279
+
c00279
+
c00279
+/// convenience wrapper of JoinContainerIntoSBuf with no caller-supplied SBuf
c00279
+template <class ContainerIterator>
c00279
+SBuf
c00279
+JoinContainerToSBuf(const ContainerIterator &begin,
c00279
+                    const ContainerIterator &end, const SBuf& separator,
c00279
+                    const SBuf& prefix = SBuf(), const SBuf& suffix = SBuf())
c00279
+{
c00279
+    SBuf rv;
c00279
+    return JoinContainerIntoSBuf(rv, begin, end, separator, prefix, suffix);
c00279
+}
c00279
+
c00279
+
c00279
 namespace std {
c00279
 /// default hash functor to support std::unordered_map<SBuf,*>
c00279
 template <>