Fix read/write past buffer end

author afresh1 <afresh1@openbsd.org>

Sun, 26 Nov 2023 16:52:12 +0000 (16:52 +0000)

committer afresh1 <afresh1@openbsd.org>

Sun, 26 Nov 2023 16:52:12 +0000 (16:52 +0000)
author afresh1 <afresh1@openbsd.org>
Sun, 26 Nov 2023 16:52:12 +0000 (16:52 +0000)
committer afresh1 <afresh1@openbsd.org>
Sun, 26 Nov 2023 16:52:12 +0000 (16:52 +0000)
diff --git a/gnu/usr.bin/perl/regcomp.c b/gnu/usr.bin/perl/regcomp.c

index 881c26c..7442e66 100644 (file)
--- a/gnu/usr.bin/perl/regcomp.c
+++ b/gnu/usr.bin/perl/regcomp.c
@@ -24250,7 +24250,7 @@ S_parse_uniprop_string(pTHX_
       * compile perl to know about them) */
      bool is_nv_type = FALSE;
  
-    unsigned int i, j = 0;
+    unsigned int i = 0, i_zero = 0, j = 0;
      int equals_pos = -1;    /* Where the '=' is found, or negative if none */
      int slash_pos  = -1;    /* Where the '/' is found, or negative if none */
      int table_index = 0;    /* The entry number for this property in the table
@@ -24384,9 +24384,13 @@ S_parse_uniprop_string(pTHX_
       * all of them are considered to be for that package.  For the purposes of
       * parsing the rest of the property, strip it off */
      if (non_pkg_begin == STRLENs("utf8::") && memBEGINPs(name, name_len, "utf8::")) {
-        lookup_name +=  STRLENs("utf8::");
-        j -=  STRLENs("utf8::");
-        equals_pos -=  STRLENs("utf8::");
+        lookup_name += STRLENs("utf8::");
+        j           -= STRLENs("utf8::");
+        equals_pos  -= STRLENs("utf8::");
+        i_zero       = STRLENs("utf8::");   /* When resetting 'i' to reparse
+                                               from the beginning, it has to be
+                                               set past what we're stripping
+                                               off */
          stripped_utf8_pkg = TRUE;
      }
  
@@ -24800,7 +24804,8 @@ S_parse_uniprop_string(pTHX_
  
              /* We set the inputs back to 0 and the code below will reparse,
               * using strict */
-            i = j = 0;
+            i = i_zero;
+            j = 0;
          }
      }
  
@@ -24821,7 +24826,7 @@ S_parse_uniprop_string(pTHX_
           * separates two digits */
          if (cur == '_') {
              if (    stricter
-                && (     i == 0 || (int) i == equals_pos || i == name_len- 1
+                && (   i == i_zero || (int) i == equals_pos || i == name_len- 1
                      || ! isDIGIT_A(name[i-1]) || ! isDIGIT_A(name[i+1])))
              {
                  lookup_name[j++] = '_';
diff --git a/gnu/usr.bin/perl/t/re/pat_advanced.t b/gnu/usr.bin/perl/t/re/pat_advanced.t

index 2a25411..088efed 100755 (executable)
--- a/gnu/usr.bin/perl/t/re/pat_advanced.t
+++ b/gnu/usr.bin/perl/t/re/pat_advanced.t
@@ -2688,6 +2688,14 @@ EOF_DEBUG_OUT
                        {}, "Related to Github Issue #19350, forward \\g{x} pattern segv under use re Debug => 'PARSE'");
      }
  
+    {   # perl-security#140, read/write past buffer end
+        fresh_perl_like('qr/\p{utf8::perl x}/',
+                        qr/Illegal user-defined property name "utf8::perl x" in regex/,
+                        {}, "perl-security#140");
+        fresh_perl_is('qr/\p{utf8::_perl_surrogate}/', "",
+                        {}, "perl-security#140");
+    }
+
  
      # !!! NOTE that tests that aren't at all likely to crash perl should go
      # a ways above, above these last ones.  There's a comment there that, like
author	afresh1 <afresh1@openbsd.org>
	Sun, 26 Nov 2023 16:52:12 +0000 (16:52 +0000)
committer	afresh1 <afresh1@openbsd.org>
	Sun, 26 Nov 2023 16:52:12 +0000 (16:52 +0000)
gnu/usr.bin/perl/regcomp.c		patch | blob | history
gnu/usr.bin/perl/t/re/pat_advanced.t		patch | blob | history