|
|
8e746e |
From a3a7598c8ec6efb0eb9c0b786d80c4d2a3751b70 Mon Sep 17 00:00:00 2001
|
|
|
8e746e |
From: Hugo van der Sanden <hv@crypt.org>
|
|
|
8e746e |
Date: Tue, 18 Feb 2020 13:51:16 +0000
|
|
|
8e746e |
Subject: [PATCH v528 2/3] study_chunk: extract rck_elide_nothing
|
|
|
8e746e |
|
|
|
8e746e |
(CVE-2020-10878)
|
|
|
8e746e |
---
|
|
|
8e746e |
embed.fnc | 1 +
|
|
|
8e746e |
embed.h | 1 +
|
|
|
8e746e |
proto.h | 3 +++
|
|
|
8e746e |
regcomp.c | 70 ++++++++++++++++++++++++++++++++++---------------------
|
|
|
8e746e |
4 files changed, 48 insertions(+), 27 deletions(-)
|
|
|
8e746e |
|
|
|
8e746e |
diff --git a/embed.fnc b/embed.fnc
|
|
|
8e746e |
index e762fe1eec..cf89277163 100644
|
|
|
8e746e |
--- a/embed.fnc
|
|
|
8e746e |
+++ b/embed.fnc
|
|
|
8e746e |
@@ -2398,6 +2398,7 @@ Es |SSize_t|study_chunk |NN RExC_state_t *pRExC_state \
|
|
|
8e746e |
|I32 stopparen|U32 recursed_depth \
|
|
|
8e746e |
|NULLOK regnode_ssc *and_withp \
|
|
|
8e746e |
|U32 flags|U32 depth|bool was_mutate_ok
|
|
|
8e746e |
+Es |void |rck_elide_nothing|NN regnode *node
|
|
|
8e746e |
EsRn |U32 |add_data |NN RExC_state_t* const pRExC_state \
|
|
|
8e746e |
|NN const char* const s|const U32 n
|
|
|
8e746e |
rs |void |re_croak2 |bool utf8|NN const char* pat1|NN const char* pat2|...
|
|
|
8e746e |
diff --git a/embed.h b/embed.h
|
|
|
8e746e |
index a5416a1148..886551ce5c 100644
|
|
|
8e746e |
--- a/embed.h
|
|
|
8e746e |
+++ b/embed.h
|
|
|
8e746e |
@@ -1046,6 +1046,7 @@
|
|
|
8e746e |
#define output_or_return_posix_warnings(a,b,c) S_output_or_return_posix_warnings(aTHX_ a,b,c)
|
|
|
8e746e |
#define parse_lparen_question_flags(a) S_parse_lparen_question_flags(aTHX_ a)
|
|
|
8e746e |
#define populate_ANYOF_from_invlist(a,b) S_populate_ANYOF_from_invlist(aTHX_ a,b)
|
|
|
8e746e |
+#define rck_elide_nothing(a) S_rck_elide_nothing(aTHX_ a)
|
|
|
8e746e |
#define reg(a,b,c,d) S_reg(aTHX_ a,b,c,d)
|
|
|
8e746e |
#define reg2Lanode(a,b,c,d) S_reg2Lanode(aTHX_ a,b,c,d)
|
|
|
8e746e |
#define reg_node(a,b) S_reg_node(aTHX_ a,b)
|
|
|
8e746e |
diff --git a/proto.h b/proto.h
|
|
|
8e746e |
index 66bb29b132..d3f8802c1d 100644
|
|
|
8e746e |
--- a/proto.h
|
|
|
8e746e |
+++ b/proto.h
|
|
|
8e746e |
@@ -5150,6 +5150,9 @@ STATIC void S_parse_lparen_question_flags(pTHX_ RExC_state_t *pRExC_state);
|
|
|
8e746e |
STATIC void S_populate_ANYOF_from_invlist(pTHX_ regnode *node, SV** invlist_ptr);
|
|
|
8e746e |
#define PERL_ARGS_ASSERT_POPULATE_ANYOF_FROM_INVLIST \
|
|
|
8e746e |
assert(node); assert(invlist_ptr)
|
|
|
8e746e |
+STATIC void S_rck_elide_nothing(pTHX_ regnode *node);
|
|
|
8e746e |
+#define PERL_ARGS_ASSERT_RCK_ELIDE_NOTHING \
|
|
|
8e746e |
+ assert(node)
|
|
|
8e746e |
PERL_STATIC_NO_RET void S_re_croak2(pTHX_ bool utf8, const char* pat1, const char* pat2, ...)
|
|
|
8e746e |
__attribute__noreturn__;
|
|
|
8e746e |
#define PERL_ARGS_ASSERT_RE_CROAK2 \
|
|
|
8e746e |
diff --git a/regcomp.c b/regcomp.c
|
|
|
8e746e |
index dd18add1db..0a9c6a8085 100644
|
|
|
8e746e |
--- a/regcomp.c
|
|
|
8e746e |
+++ b/regcomp.c
|
|
|
8e746e |
@@ -4094,6 +4094,43 @@ S_unwind_scan_frames(pTHX_ const void *p)
|
|
|
8e746e |
} while (f);
|
|
|
8e746e |
}
|
|
|
8e746e |
|
|
|
8e746e |
+/* Follow the next-chain of the current node and optimize away
|
|
|
8e746e |
+ all the NOTHINGs from it.
|
|
|
8e746e |
+ */
|
|
|
8e746e |
+STATIC void
|
|
|
8e746e |
+S_rck_elide_nothing(pTHX_ regnode *node)
|
|
|
8e746e |
+{
|
|
|
8e746e |
+ dVAR;
|
|
|
8e746e |
+
|
|
|
8e746e |
+ PERL_ARGS_ASSERT_RCK_ELIDE_NOTHING;
|
|
|
8e746e |
+
|
|
|
8e746e |
+ if (OP(node) != CURLYX) {
|
|
|
8e746e |
+ const int max = (reg_off_by_arg[OP(node)]
|
|
|
8e746e |
+ ? I32_MAX
|
|
|
8e746e |
+ /* I32 may be smaller than U16 on CRAYs! */
|
|
|
8e746e |
+ : (I32_MAX < U16_MAX ? I32_MAX : U16_MAX));
|
|
|
8e746e |
+ int off = (reg_off_by_arg[OP(node)] ? ARG(node) : NEXT_OFF(node));
|
|
|
8e746e |
+ int noff;
|
|
|
8e746e |
+ regnode *n = node;
|
|
|
8e746e |
+
|
|
|
8e746e |
+ /* Skip NOTHING and LONGJMP. */
|
|
|
8e746e |
+ while (
|
|
|
8e746e |
+ (n = regnext(n))
|
|
|
8e746e |
+ && (
|
|
|
8e746e |
+ (PL_regkind[OP(n)] == NOTHING && (noff = NEXT_OFF(n)))
|
|
|
8e746e |
+ || ((OP(n) == LONGJMP) && (noff = ARG(n)))
|
|
|
8e746e |
+ )
|
|
|
8e746e |
+ && off + noff < max
|
|
|
8e746e |
+ ) {
|
|
|
8e746e |
+ off += noff;
|
|
|
8e746e |
+ }
|
|
|
8e746e |
+ if (reg_off_by_arg[OP(node)])
|
|
|
8e746e |
+ ARG(node) = off;
|
|
|
8e746e |
+ else
|
|
|
8e746e |
+ NEXT_OFF(node) = off;
|
|
|
8e746e |
+ }
|
|
|
8e746e |
+ return;
|
|
|
8e746e |
+}
|
|
|
8e746e |
|
|
|
8e746e |
STATIC SSize_t
|
|
|
8e746e |
S_study_chunk(pTHX_ RExC_state_t *pRExC_state, regnode **scanp,
|
|
|
8e746e |
@@ -4197,28 +4234,10 @@ S_study_chunk(pTHX_ RExC_state_t *pRExC_state, regnode **scanp,
|
|
|
8e746e |
if (mutate_ok)
|
|
|
8e746e |
JOIN_EXACT(scan,&min_subtract, &unfolded_multi_char, 0);
|
|
|
8e746e |
|
|
|
8e746e |
- /* Follow the next-chain of the current node and optimize
|
|
|
8e746e |
- away all the NOTHINGs from it. */
|
|
|
8e746e |
- if (OP(scan) != CURLYX) {
|
|
|
8e746e |
- const int max = (reg_off_by_arg[OP(scan)]
|
|
|
8e746e |
- ? I32_MAX
|
|
|
8e746e |
- /* I32 may be smaller than U16 on CRAYs! */
|
|
|
8e746e |
- : (I32_MAX < U16_MAX ? I32_MAX : U16_MAX));
|
|
|
8e746e |
- int off = (reg_off_by_arg[OP(scan)] ? ARG(scan) : NEXT_OFF(scan));
|
|
|
8e746e |
- int noff;
|
|
|
8e746e |
- regnode *n = scan;
|
|
|
8e746e |
-
|
|
|
8e746e |
- /* Skip NOTHING and LONGJMP. */
|
|
|
8e746e |
- while ((n = regnext(n))
|
|
|
8e746e |
- && ((PL_regkind[OP(n)] == NOTHING && (noff = NEXT_OFF(n)))
|
|
|
8e746e |
- || ((OP(n) == LONGJMP) && (noff = ARG(n))))
|
|
|
8e746e |
- && off + noff < max)
|
|
|
8e746e |
- off += noff;
|
|
|
8e746e |
- if (reg_off_by_arg[OP(scan)])
|
|
|
8e746e |
- ARG(scan) = off;
|
|
|
8e746e |
- else
|
|
|
8e746e |
- NEXT_OFF(scan) = off;
|
|
|
8e746e |
- }
|
|
|
8e746e |
+ /* Follow the next-chain of the current node and optimize
|
|
|
8e746e |
+ away all the NOTHINGs from it.
|
|
|
8e746e |
+ */
|
|
|
8e746e |
+ rck_elide_nothing(scan);
|
|
|
8e746e |
|
|
|
8e746e |
/* The principal pseudo-switch. Cannot be a switch, since we
|
|
|
8e746e |
look into several different things. */
|
|
|
8e746e |
@@ -5348,11 +5367,7 @@ Perl_re_printf( aTHX_ "LHS=%" UVuf " RHS=%" UVuf "\n",
|
|
|
8e746e |
if (data && (fl & SF_HAS_EVAL))
|
|
|
8e746e |
data->flags |= SF_HAS_EVAL;
|
|
|
8e746e |
optimize_curly_tail:
|
|
|
8e746e |
- if (OP(oscan) != CURLYX) {
|
|
|
8e746e |
- while (PL_regkind[OP(next = regnext(oscan))] == NOTHING
|
|
|
8e746e |
- && NEXT_OFF(next))
|
|
|
8e746e |
- NEXT_OFF(oscan) += NEXT_OFF(next);
|
|
|
8e746e |
- }
|
|
|
8e746e |
+ rck_elide_nothing(oscan);
|
|
|
8e746e |
continue;
|
|
|
8e746e |
|
|
|
8e746e |
default:
|
|
|
8e746e |
--
|
|
|
8e746e |
2.20.1
|
|
|
8e746e |
|