Blame SOURCES/squid-4.0.21-large-acl.patch

5e05d2
diff --git a/src/acl/RegexData.cc b/src/acl/RegexData.cc
5e05d2
index 01a4c12..b5c1679 100644
5e05d2
--- a/src/acl/RegexData.cc
5e05d2
+++ b/src/acl/RegexData.cc
5e05d2
@@ -22,6 +22,7 @@
5e05d2
 #include "ConfigParser.h"
5e05d2
 #include "Debug.h"
5e05d2
 #include "sbuf/List.h"
5e05d2
+#include "sbuf/Algorithms.h"
5e05d2
 
5e05d2
 ACLRegexData::~ACLRegexData()
5e05d2
 {
5e05d2
@@ -129,6 +130,18 @@ compileRE(std::list<RegexPattern> &curlist, const char * RE, int flags)
5e05d2
     return true;
5e05d2
 }
5e05d2
 
5e05d2
+static bool
5e05d2
+compileRE(std::list<RegexPattern> &curlist, const SBufList &RE, int flags)
5e05d2
+{
5e05d2
+	if (RE.empty())
5e05d2
+		return curlist.empty(); // XXX: old code did this. It looks wrong.
5e05d2
+	SBuf regexp;
5e05d2
+	static const SBuf openparen("("), closeparen(")"), separator(")|(");
5e05d2
+	JoinContainerIntoSBuf(regexp, RE.begin(), RE.end(), separator, openparen,
5e05d2
+			closeparen);
5e05d2
+	return compileRE(curlist, regexp.c_str(), flags);
5e05d2
+}
5e05d2
+
5e05d2
 /** Compose and compile one large RE from a set of (small) REs.
5e05d2
  * The ultimate goal is to have only one RE per ACL so that match() is
5e05d2
  * called only once per ACL.
5e05d2
@@ -137,16 +150,11 @@ static int
5e05d2
 compileOptimisedREs(std::list<RegexPattern> &curlist, const SBufList &sl)
5e05d2
 {
5e05d2
     std::list<RegexPattern> newlist;
5e05d2
-    int numREs = 0;
5e05d2
+    SBufList accumulatedRE;
5e05d2
+    int numREs = 0, reSize = 0;
5e05d2
     int flags = REG_EXTENDED | REG_NOSUB;
5e05d2
-    int largeREindex = 0;
5e05d2
-    char largeRE[BUFSIZ];
5e05d2
-    *largeRE = 0;
5e05d2
 
5e05d2
     for (const SBuf & configurationLineWord : sl) {
5e05d2
-        int RElen;
5e05d2
-        RElen = configurationLineWord.length();
5e05d2
-
5e05d2
         static const SBuf minus_i("-i");
5e05d2
         static const SBuf plus_i("+i");
5e05d2
         if (configurationLineWord == minus_i) {
5e05d2
@@ -155,10 +163,11 @@ compileOptimisedREs(std::list<RegexPattern> &curlist, const SBufList &sl)
5e05d2
                 debugs(28, 2, "optimisation of -i ... -i" );
5e05d2
             } else {
5e05d2
                 debugs(28, 2, "-i" );
5e05d2
-                if (!compileRE(newlist, largeRE, flags))
5e05d2
+                if (!compileRE(newlist, accumulatedRE, flags))
5e05d2
                     return 0;
5e05d2
                 flags |= REG_ICASE;
5e05d2
-                largeRE[largeREindex=0] = '\0';
5e05d2
+                accumulatedRE.clear();
5e05d2
+                reSize = 0;
5e05d2
             }
5e05d2
         } else if (configurationLineWord == plus_i) {
5e05d2
             if ((flags & REG_ICASE) == 0) {
5e05d2
@@ -166,37 +175,34 @@ compileOptimisedREs(std::list<RegexPattern> &curlist, const SBufList &sl)
5e05d2
                 debugs(28, 2, "optimisation of +i ... +i");
5e05d2
             } else {
5e05d2
                 debugs(28, 2, "+i");
5e05d2
-                if (!compileRE(newlist, largeRE, flags))
5e05d2
+                if (!compileRE(newlist, accumulatedRE, flags))
5e05d2
                     return 0;
5e05d2
                 flags &= ~REG_ICASE;
5e05d2
-                largeRE[largeREindex=0] = '\0';
5e05d2
+                accumulatedRE.clear();
5e05d2
+                reSize = 0;
5e05d2
             }
5e05d2
-        } else if (RElen + largeREindex + 3 < BUFSIZ-1) {
5e05d2
+        } else if (reSize < 1024) {
5e05d2
             debugs(28, 2, "adding RE '" << configurationLineWord << "'");
5e05d2
-            if (largeREindex > 0) {
5e05d2
-                largeRE[largeREindex] = '|';
5e05d2
-                ++largeREindex;
5e05d2
-            }
5e05d2
-            largeRE[largeREindex] = '(';
5e05d2
-            ++largeREindex;
5e05d2
-            configurationLineWord.copy(largeRE+largeREindex, BUFSIZ-largeREindex);
5e05d2
-            largeREindex += configurationLineWord.length();
5e05d2
-            largeRE[largeREindex] = ')';
5e05d2
-            ++largeREindex;
5e05d2
-            largeRE[largeREindex] = '\0';
5e05d2
+            accumulatedRE.push_back(configurationLineWord);
5e05d2
             ++numREs;
5e05d2
+            reSize += configurationLineWord.length();
5e05d2
         } else {
5e05d2
             debugs(28, 2, "buffer full, generating new optimised RE..." );
5e05d2
-            if (!compileRE(newlist, largeRE, flags))
5e05d2
+            accumulatedRE.push_back(configurationLineWord);
5e05d2
+            if (!compileRE(newlist, accumulatedRE, flags))
5e05d2
                 return 0;
5e05d2
-            largeRE[largeREindex=0] = '\0';
5e05d2
+            accumulatedRE.clear();
5e05d2
+            reSize = 0;
5e05d2
             continue;    /* do the loop again to add the RE to largeRE */
5e05d2
         }
5e05d2
     }
5e05d2
 
5e05d2
-    if (!compileRE(newlist, largeRE, flags))
5e05d2
+    if (!compileRE(newlist, accumulatedRE, flags))
5e05d2
         return 0;
5e05d2
 
5e05d2
+    accumulatedRE.clear();
5e05d2
+    reSize = 0;
5e05d2
+
5e05d2
     /* all was successful, so put the new list at the tail */
5e05d2
     curlist.splice(curlist.end(), newlist);
5e05d2
 
5e05d2
diff --git a/src/sbuf/Algorithms.h b/src/sbuf/Algorithms.h
5e05d2
index 21ee889..338e9c0 100644
5e05d2
--- a/src/sbuf/Algorithms.h
5e05d2
+++ b/src/sbuf/Algorithms.h
5e05d2
@@ -81,6 +81,57 @@ SBufContainerJoin(const Container &items, const SBuf& separator)
5e05d2
     return rv;
5e05d2
 }
5e05d2
 
5e05d2
+/** Join container of SBufs and append to supplied target
5e05d2
+ *
5e05d2
+ * append to the target SBuf all elements in the [begin,end) range from
5e05d2
+ * an iterable container, prefixed by prefix, separated by separator and
5e05d2
+ * followed by suffix. Prefix and suffix are added also in case of empty
5e05d2
+ * iterable
5e05d2
+ *
5e05d2
+ * \return the modified dest
5e05d2
+ */
5e05d2
+template <class ContainerIterator>
5e05d2
+SBuf&
5e05d2
+JoinContainerIntoSBuf(SBuf &dest, const ContainerIterator &begin,
5e05d2
+                      const ContainerIterator &end, const SBuf& separator,
5e05d2
+                      const SBuf& prefix = SBuf(), const SBuf& suffix = SBuf())
5e05d2
+{
5e05d2
+    if (begin == end) {
5e05d2
+        dest.append(prefix).append(suffix);
5e05d2
+        return dest;
5e05d2
+    }
5e05d2
+
5e05d2
+    // optimization: pre-calculate needed storage
5e05d2
+    const SBuf::size_type totalContainerSize =
5e05d2
+        std::accumulate(begin, end, 0, SBufAddLength(separator)) +
5e05d2
+        dest.length() + prefix.length() + suffix.length();
5e05d2
+    SBufReservationRequirements req;
5e05d2
+    req.minSpace = totalContainerSize;
5e05d2
+    dest.reserve(req);
5e05d2
+
5e05d2
+    auto i = begin;
5e05d2
+    dest.append(prefix);
5e05d2
+    dest.append(*i);
5e05d2
+    ++i;
5e05d2
+    for (; i != end; ++i)
5e05d2
+        dest.append(separator).append(*i);
5e05d2
+    dest.append(suffix);
5e05d2
+    return dest;
5e05d2
+}
5e05d2
+
5e05d2
+
5e05d2
+/// convenience wrapper of JoinContainerIntoSBuf with no caller-supplied SBuf
5e05d2
+template <class ContainerIterator>
5e05d2
+SBuf
5e05d2
+JoinContainerToSBuf(const ContainerIterator &begin,
5e05d2
+                    const ContainerIterator &end, const SBuf& separator,
5e05d2
+                    const SBuf& prefix = SBuf(), const SBuf& suffix = SBuf())
5e05d2
+{
5e05d2
+    SBuf rv;
5e05d2
+    return JoinContainerIntoSBuf(rv, begin, end, separator, prefix, suffix);
5e05d2
+}
5e05d2
+
5e05d2
+
5e05d2
 namespace std {
5e05d2
 /// default hash functor to support std::unordered_map<SBuf,*>
5e05d2
 template <>