Regex: Update PCRE to v8.35.
I was über lazy at first, so I took the libs from SM. But it's actually quite easy to compile, so let's update to the latest version \o/.
This commit is contained in:
76
tools/pcre/testdata/testoutput18-32
vendored
76
tools/pcre/testdata/testoutput18-32
vendored
@ -1,5 +1,7 @@
|
||||
/-- This set of tests is for UTF-16 and UTF-32 support, and is relevant only to the
|
||||
16- and 32-bit library. --/
|
||||
/-- This set of tests is for UTF-16 and UTF-32 support, and is relevant only to
|
||||
the 16- and 32-bit libraries. --/
|
||||
|
||||
< forbid W
|
||||
|
||||
/<2F><><EFBFBD>xxx/8?DZSS
|
||||
**Failed: invalid UTF-8 string cannot be converted to UTF-32
|
||||
@ -335,7 +337,7 @@ Options: utf
|
||||
No first char
|
||||
No need char
|
||||
Subject length lower bound = 1
|
||||
Starting byte set: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a
|
||||
Starting chars: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a
|
||||
\x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19
|
||||
\x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4
|
||||
5 6 7 8 9 : ; < = > ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y
|
||||
@ -365,7 +367,7 @@ No match
|
||||
------------------------------------------------------------------
|
||||
Bra
|
||||
\x{100}{3}
|
||||
\x{100}?
|
||||
\x{100}?+
|
||||
Ket
|
||||
End
|
||||
------------------------------------------------------------------
|
||||
@ -374,7 +376,7 @@ Options: utf
|
||||
First char = \x{100}
|
||||
Need char = \x{100}
|
||||
Subject length lower bound = 3
|
||||
No set of starting bytes
|
||||
No starting char list
|
||||
\x{100}\x{100}\x{100}\x{100\x{100}
|
||||
0: \x{100}\x{100}\x{100}
|
||||
|
||||
@ -382,7 +384,7 @@ No set of starting bytes
|
||||
------------------------------------------------------------------
|
||||
Bra
|
||||
CBra 1
|
||||
\x{100}+
|
||||
\x{100}++
|
||||
Alt
|
||||
x
|
||||
Ket
|
||||
@ -394,7 +396,7 @@ Options: utf
|
||||
No first char
|
||||
No need char
|
||||
Subject length lower bound = 1
|
||||
Starting byte set: x \xff
|
||||
Starting chars: x \xff
|
||||
|
||||
/(\x{100}*a|x)/8SDZ
|
||||
------------------------------------------------------------------
|
||||
@ -413,13 +415,13 @@ Options: utf
|
||||
No first char
|
||||
No need char
|
||||
Subject length lower bound = 1
|
||||
Starting byte set: a x \xff
|
||||
Starting chars: a x \xff
|
||||
|
||||
/(\x{100}{0,2}a|x)/8SDZ
|
||||
------------------------------------------------------------------
|
||||
Bra
|
||||
CBra 1
|
||||
\x{100}{0,2}
|
||||
\x{100}{0,2}+
|
||||
a
|
||||
Alt
|
||||
x
|
||||
@ -432,14 +434,14 @@ Options: utf
|
||||
No first char
|
||||
No need char
|
||||
Subject length lower bound = 1
|
||||
Starting byte set: a x \xff
|
||||
Starting chars: a x \xff
|
||||
|
||||
/(\x{100}{1,2}a|x)/8SDZ
|
||||
------------------------------------------------------------------
|
||||
Bra
|
||||
CBra 1
|
||||
\x{100}
|
||||
\x{100}{0,1}
|
||||
\x{100}{0,1}+
|
||||
a
|
||||
Alt
|
||||
x
|
||||
@ -452,7 +454,7 @@ Options: utf
|
||||
No first char
|
||||
No need char
|
||||
Subject length lower bound = 1
|
||||
Starting byte set: x \xff
|
||||
Starting chars: x \xff
|
||||
|
||||
/\x{100}/8DZ
|
||||
------------------------------------------------------------------
|
||||
@ -470,7 +472,7 @@ No need char
|
||||
------------------------------------------------------------------
|
||||
Bra
|
||||
a\x{100}
|
||||
\x{101}*
|
||||
\x{101}*+
|
||||
Ket
|
||||
End
|
||||
------------------------------------------------------------------
|
||||
@ -483,7 +485,7 @@ Need char = \x{100}
|
||||
------------------------------------------------------------------
|
||||
Bra
|
||||
a\x{100}
|
||||
\x{101}+
|
||||
\x{101}++
|
||||
Ket
|
||||
End
|
||||
------------------------------------------------------------------
|
||||
@ -606,8 +608,6 @@ Need char = 'X'
|
||||
Failed: missing terminating ] for character class at offset 13
|
||||
|
||||
/X/8
|
||||
\x{0}\x{d7ff}\x{e000}\x{10ffff}
|
||||
Error -10 (bad UTF-32 string) offset=3 reason=2
|
||||
\x{d800}
|
||||
Error -10 (bad UTF-32 string) offset=0 reason=1
|
||||
\x{d800}\?
|
||||
@ -632,11 +632,9 @@ No match
|
||||
Error -10 (bad UTF-32 string) offset=0 reason=3
|
||||
\x{d800}\x{1234}
|
||||
Error -10 (bad UTF-32 string) offset=0 reason=1
|
||||
\x{fffe}
|
||||
Error -10 (bad UTF-32 string) offset=0 reason=2
|
||||
|
||||
/(*UTF16)\x{11234}/
|
||||
Failed: (*VERB) not recognized at offset 5
|
||||
Failed: (*VERB) not recognized or malformed at offset 5
|
||||
|
||||
/(*UTF)\x{11234}/I
|
||||
Capturing subpattern count = 0
|
||||
@ -647,10 +645,10 @@ No need char
|
||||
0: \x{11234}
|
||||
|
||||
/(*UTF-32)\x{11234}/
|
||||
Failed: (*VERB) not recognized at offset 5
|
||||
Failed: (*VERB) not recognized or malformed at offset 5
|
||||
|
||||
/(*CRLF)(*UTF16)(*BSR_UNICODE)a\Rb/I
|
||||
Failed: (*VERB) not recognized at offset 12
|
||||
Failed: (*VERB) not recognized or malformed at offset 12
|
||||
|
||||
/(*CRLF)(*UTF32)(*BSR_UNICODE)a\Rb/I
|
||||
Capturing subpattern count = 0
|
||||
@ -665,7 +663,7 @@ Options: utf
|
||||
No first char
|
||||
No need char
|
||||
Subject length lower bound = 1
|
||||
Starting byte set: \x09 \x20 \xa0 \xff
|
||||
Starting chars: \x09 \x20 \xa0 \xff
|
||||
ABC\x{09}
|
||||
0: \x{09}
|
||||
ABC\x{20}
|
||||
@ -691,7 +689,7 @@ Options: utf
|
||||
No first char
|
||||
No need char
|
||||
Subject length lower bound = 1
|
||||
Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff
|
||||
Starting chars: \x0a \x0b \x0c \x0d \x85 \xff
|
||||
ABC\x{0a}
|
||||
0: \x{0a}
|
||||
ABC\x{0b}
|
||||
@ -711,19 +709,19 @@ Options: utf
|
||||
No first char
|
||||
Need char = 'A'
|
||||
Subject length lower bound = 1
|
||||
Starting byte set: \x09 \x20 A \xa0 \xff
|
||||
Starting chars: \x09 \x20 A \xa0 \xff
|
||||
CDBABC
|
||||
0: A
|
||||
\x{2000}ABC
|
||||
0: \x{2000}A
|
||||
|
||||
/\R*A/SI8
|
||||
/\R*A/SI8<bsr_unicode>
|
||||
Capturing subpattern count = 0
|
||||
Options: utf
|
||||
Options: bsr_unicode utf
|
||||
No first char
|
||||
Need char = 'A'
|
||||
Subject length lower bound = 1
|
||||
Starting byte set: \x0a \x0b \x0c \x0d A \x85 \xff
|
||||
Starting chars: \x0a \x0b \x0c \x0d A \x85 \xff
|
||||
CDBABC
|
||||
0: A
|
||||
\x{2028}A
|
||||
@ -735,7 +733,7 @@ Options: utf
|
||||
No first char
|
||||
Need char = 'A'
|
||||
Subject length lower bound = 2
|
||||
Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff
|
||||
Starting chars: \x0a \x0b \x0c \x0d \x85 \xff
|
||||
|
||||
/\s?xxx\s/8SI
|
||||
Capturing subpattern count = 0
|
||||
@ -743,7 +741,7 @@ Options: utf
|
||||
No first char
|
||||
Need char = 'x'
|
||||
Subject length lower bound = 4
|
||||
Starting byte set: \x09 \x0a \x0c \x0d \x20 x
|
||||
Starting chars: \x09 \x0a \x0b \x0c \x0d \x20 x
|
||||
|
||||
/\sxxx\s/I8ST1
|
||||
Capturing subpattern count = 0
|
||||
@ -751,7 +749,7 @@ Options: utf
|
||||
No first char
|
||||
Need char = 'x'
|
||||
Subject length lower bound = 5
|
||||
Starting byte set: \x09 \x0a \x0c \x0d \x20 \x85 \xa0
|
||||
Starting chars: \x09 \x0a \x0c \x0d \x20 \x85 \xa0
|
||||
AB\x{85}xxx\x{a0}XYZ
|
||||
0: \x{85}xxx\x{a0}
|
||||
AB\x{a0}xxx\x{85}XYZ
|
||||
@ -763,7 +761,7 @@ Options: utf
|
||||
No first char
|
||||
Need char = ' '
|
||||
Subject length lower bound = 3
|
||||
Starting byte set: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x0b \x0e
|
||||
Starting chars: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x0b \x0e
|
||||
\x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 \x1a \x1b \x1c \x1d
|
||||
\x1e \x1f ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 5 6 7 8 9 : ; < = > ? @
|
||||
A B C D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c d e
|
||||
@ -802,7 +800,7 @@ Options: caseless utf
|
||||
First char = \x{1234}
|
||||
No need char
|
||||
Subject length lower bound = 1
|
||||
No set of starting bytes
|
||||
No starting char list
|
||||
|
||||
/\x{1234}+?/iS8I
|
||||
Capturing subpattern count = 0
|
||||
@ -810,7 +808,7 @@ Options: caseless utf
|
||||
First char = \x{1234}
|
||||
No need char
|
||||
Subject length lower bound = 1
|
||||
No set of starting bytes
|
||||
No starting char list
|
||||
|
||||
/\x{1234}++/iS8I
|
||||
Capturing subpattern count = 0
|
||||
@ -818,7 +816,7 @@ Options: caseless utf
|
||||
First char = \x{1234}
|
||||
No need char
|
||||
Subject length lower bound = 1
|
||||
No set of starting bytes
|
||||
No starting char list
|
||||
|
||||
/\x{1234}{2}/iS8I
|
||||
Capturing subpattern count = 0
|
||||
@ -826,7 +824,7 @@ Options: caseless utf
|
||||
First char = \x{1234}
|
||||
Need char = \x{1234}
|
||||
Subject length lower bound = 2
|
||||
No set of starting bytes
|
||||
No starting char list
|
||||
|
||||
/[^\x{c4}]/8DZ
|
||||
------------------------------------------------------------------
|
||||
@ -859,7 +857,7 @@ Options: utf
|
||||
No first char
|
||||
No need char
|
||||
Subject length lower bound = 1
|
||||
Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff
|
||||
Starting chars: \x0a \x0b \x0c \x0d \x85 \xff
|
||||
|
||||
/-- Check bad offset --/
|
||||
|
||||
@ -1016,4 +1014,10 @@ Error -24 (bad offset value)
|
||||
\x{a0}\x20!
|
||||
0: \x{a0} !
|
||||
|
||||
/(*UTF)abc/9
|
||||
Failed: setting UTF is disabled by the application at offset 0
|
||||
|
||||
/abc/89
|
||||
Failed: setting UTF is disabled by the application at offset 0
|
||||
|
||||
/-- End of testinput18 --/
|
||||
|
Reference in New Issue
Block a user