b8c914
From 07ebe9c4fb1028d17e61caabe8c15abd0cd48983 Mon Sep 17 00:00:00 2001
b8c914
From: Yves Orton <demerphq@gmail.com>
b8c914
Date: Thu, 29 Jun 2017 11:31:14 +0200
b8c914
Subject: [PATCH] Parse caret vars with subscripts the same as normal vars
b8c914
 inside of ${..} escaping
b8c914
MIME-Version: 1.0
b8c914
Content-Type: text/plain; charset=UTF-8
b8c914
Content-Transfer-Encoding: 8bit
b8c914
b8c914
This behavior is discussed in perl #131664, which complains that
b8c914
"${^CAPTURE}[0]" does not work as expected. Abigail explains the
b8c914
behavior is by design and Eirik Berg Hanssen expands on that explanation
b8c914
pointing out that what /should/ work, "${^CAPTURE[0]}", does not,
b8c914
which Sawyer then ruled was a bug.
b8c914
b8c914
So this patch makes "${^CAPTURE[0]}" (and "${^CAPTURE [0]}" [hi
b8c914
Abigail]) work the same as they would if the var was called @foo.
b8c914
b8c914
Petr Písař: Ported to 5.26.2-RC1.
b8c914
b8c914
Signed-off-by: Petr Písař <ppisar@redhat.com>
b8c914
---
b8c914
 t/base/lex.t | 28 +++++++++++++++++++++++++++-
b8c914
 toke.c       | 46 +++++++++++++++++++++++++---------------------
b8c914
 2 files changed, 52 insertions(+), 22 deletions(-)
b8c914
b8c914
diff --git a/t/base/lex.t b/t/base/lex.t
b8c914
index 99fd3bb..ae17bbd 100644
b8c914
--- a/t/base/lex.t
b8c914
+++ b/t/base/lex.t
b8c914
@@ -1,6 +1,6 @@
b8c914
 #!./perl
b8c914
 
b8c914
-print "1..112\n";
b8c914
+print "1..119\n";
b8c914
 
b8c914
 $x = 'x';
b8c914
 
b8c914
@@ -154,6 +154,32 @@ my $test = 31;
b8c914
   print "not " unless index ($@, 'Can\'t use global $^XYZ in "my"') > -1;
b8c914
   print "ok $test\n"; $test++;
b8c914
 #  print "($@)\n" if $@;
b8c914
+#
b8c914
+  ${^TEST}= "splat";
b8c914
+  @{^TEST}= ("foo", "bar");
b8c914
+  %{^TEST}= ("foo" => "FOO", "bar" => "BAR" );
b8c914
+
b8c914
+  print "not " if "${^TEST}" ne "splat";
b8c914
+  print "ok $test\n"; $test++;
b8c914
+
b8c914
+  print "not " if "${^TEST}[0]" ne "splat[0]";
b8c914
+  print "ok $test\n"; $test++;
b8c914
+
b8c914
+  print "not " if "${^TEST[0]}" ne "foo";
b8c914
+  print "ok $test\n"; $test++;
b8c914
+
b8c914
+  print "not " if "${ ^TEST [1] }" ne "bar";
b8c914
+  print "ok $test\n"; $test++;
b8c914
+
b8c914
+  print "not " if "${^TEST}{foo}" ne "splat{foo}";
b8c914
+  print "ok $test\n"; $test++;
b8c914
+
b8c914
+  print "not " if "${^TEST{foo}}" ne "FOO";
b8c914
+  print "ok $test\n"; $test++;
b8c914
+
b8c914
+  print "not " if "${ ^TEST {bar} }" ne "BAR";
b8c914
+  print "ok $test\n"; $test++;
b8c914
+
b8c914
 
b8c914
 # Now let's make sure that caret variables are all forced into the main package.
b8c914
   package Someother;
b8c914
diff --git a/toke.c b/toke.c
b8c914
index ee9c464..aff785b 100644
b8c914
--- a/toke.c
b8c914
+++ b/toke.c
b8c914
@@ -9416,19 +9416,36 @@ S_scan_ident(pTHX_ char *s, char *dest, STRLEN destlen, I32 ck_uni)
b8c914
         bool skip;
b8c914
         char *s2;
b8c914
         /* If we were processing {...} notation then...  */
b8c914
-        if (isIDFIRST_lazy_if_safe(d, e, is_utf8)) {
b8c914
-            /* if it starts as a valid identifier, assume that it is one.
b8c914
-               (the later check for } being at the expected point will trap
b8c914
-               cases where this doesn't pan out.)  */
b8c914
-            d += is_utf8 ? UTF8SKIP(d) : 1;
b8c914
-            parse_ident(&s, &d, e, 1, is_utf8, TRUE);
b8c914
-	    *d = '\0';
b8c914
+        if (isIDFIRST_lazy_if_safe(d, e, is_utf8)
b8c914
+            || (!isPRINT(*d) /* isCNTRL(d), plus all non-ASCII */
b8c914
+                 && isWORDCHAR(*s))
b8c914
+        ) {
b8c914
+            /* note we have to check for a normal identifier first,
b8c914
+             * as it handles utf8 symbols, and only after that has
b8c914
+             * been ruled out can we look at the caret words */
b8c914
+            if (isIDFIRST_lazy_if_safe(d, e, is_utf8) ) {
b8c914
+                /* if it starts as a valid identifier, assume that it is one.
b8c914
+                   (the later check for } being at the expected point will trap
b8c914
+                   cases where this doesn't pan out.)  */
b8c914
+                d += is_utf8 ? UTF8SKIP(d) : 1;
b8c914
+                parse_ident(&s, &d, e, 1, is_utf8, TRUE);
b8c914
+                *d = '\0';
b8c914
+            }
b8c914
+            else { /* caret word: ${^Foo} ${^CAPTURE[0]} */
b8c914
+                d++;
b8c914
+                while (isWORDCHAR(*s) && d < e) {
b8c914
+                    *d++ = *s++;
b8c914
+                }
b8c914
+                if (d >= e)
b8c914
+                    Perl_croak(aTHX_ "%s", ident_too_long);
b8c914
+                *d = '\0';
b8c914
+            }
b8c914
             tmp_copline = CopLINE(PL_curcop);
b8c914
             if (s < PL_bufend && isSPACE(*s)) {
b8c914
                 s = skipspace(s);
b8c914
             }
b8c914
 	    if ((*s == '[' || (*s == '{' && strNE(dest, "sub")))) {
b8c914
-                /* ${foo[0]} and ${foo{bar}} notation.  */
b8c914
+                /* ${foo[0]} and ${foo{bar}} and ${^CAPTURE[0]} notation.  */
b8c914
 		if (ckWARN(WARN_AMBIGUOUS) && keyword(dest, d - dest, 0)) {
b8c914
 		    const char * const brack =
b8c914
 			(const char *)
b8c914
@@ -9447,19 +9464,6 @@ S_scan_ident(pTHX_ char *s, char *dest, STRLEN destlen, I32 ck_uni)
b8c914
 		return s;
b8c914
 	    }
b8c914
 	}
b8c914
-	/* Handle extended ${^Foo} variables
b8c914
-	 * 1999-02-27 mjd-perl-patch@plover.com */
b8c914
-	else if (! isPRINT(*d) /* isCNTRL(d), plus all non-ASCII */
b8c914
-		 && isWORDCHAR(*s))
b8c914
-	{
b8c914
-	    d++;
b8c914
-	    while (isWORDCHAR(*s) && d < e) {
b8c914
-		*d++ = *s++;
b8c914
-	    }
b8c914
-	    if (d >= e)
b8c914
-		Perl_croak(aTHX_ "%s", ident_too_long);
b8c914
-	    *d = '\0';
b8c914
-	}
b8c914
 
b8c914
         if ( !tmp_copline )
b8c914
             tmp_copline = CopLINE(PL_curcop);
b8c914
-- 
b8c914
2.14.3
b8c914