1 /-- This set of tests is for UTF-16 and UTF-32 support, and is relevant only to the
2 16- and 32-bit library. --/
5 **Failed: invalid UTF-8 string cannot be converted to UTF-32
9 **Failed: invalid UTF-8 string cannot be used as input in UTF mode
43 0: X\x{11234}\x{512}YZ
44 X\x{11234}\x{512}\x{11234}Z
45 0: X\x{11234}\x{512}\x{11234}Z
71 0: a\x{12257}\x{11234}b
81 /-- Check maximum character size --/
84 ------------------------------------------------------------------
89 ------------------------------------------------------------------
90 Capturing subpattern count = 0
96 ------------------------------------------------------------------
101 ------------------------------------------------------------------
102 Capturing subpattern count = 0
104 First char = \x{10000}
108 ------------------------------------------------------------------
113 ------------------------------------------------------------------
114 Capturing subpattern count = 0
120 ------------------------------------------------------------------
125 ------------------------------------------------------------------
126 Capturing subpattern count = 0
128 First char = \x{1000}
132 ------------------------------------------------------------------
137 ------------------------------------------------------------------
138 Capturing subpattern count = 0
140 First char = \x{10000}
144 ------------------------------------------------------------------
149 ------------------------------------------------------------------
150 Capturing subpattern count = 0
152 First char = \x{100000}
156 ------------------------------------------------------------------
161 ------------------------------------------------------------------
162 Capturing subpattern count = 0
164 First char = \x{10ffff}
168 ------------------------------------------------------------------
173 ------------------------------------------------------------------
174 Capturing subpattern count = 0
180 ------------------------------------------------------------------
185 ------------------------------------------------------------------
186 Capturing subpattern count = 0
192 ------------------------------------------------------------------
197 ------------------------------------------------------------------
198 Capturing subpattern count = 0
204 ------------------------------------------------------------------
209 ------------------------------------------------------------------
210 Capturing subpattern count = 0
215 /\x{D55c}\x{ad6d}\x{C5B4}/DZ8
216 ------------------------------------------------------------------
218 \x{d55c}\x{ad6d}\x{c5b4}
221 ------------------------------------------------------------------
222 Capturing subpattern count = 0
224 First char = \x{d55c}
226 \x{D55c}\x{ad6d}\x{C5B4}
227 0: \x{d55c}\x{ad6d}\x{c5b4}
229 /\x{65e5}\x{672c}\x{8a9e}/DZ8
230 ------------------------------------------------------------------
232 \x{65e5}\x{672c}\x{8a9e}
235 ------------------------------------------------------------------
236 Capturing subpattern count = 0
238 First char = \x{65e5}
240 \x{65e5}\x{672c}\x{8a9e}
241 0: \x{65e5}\x{672c}\x{8a9e}
244 ------------------------------------------------------------------
249 ------------------------------------------------------------------
250 Capturing subpattern count = 0
256 ------------------------------------------------------------------
261 ------------------------------------------------------------------
262 Capturing subpattern count = 0
268 ------------------------------------------------------------------
273 ------------------------------------------------------------------
274 Capturing subpattern count = 0
280 ------------------------------------------------------------------
285 ------------------------------------------------------------------
286 Capturing subpattern count = 0
292 ------------------------------------------------------------------
297 ------------------------------------------------------------------
298 Capturing subpattern count = 0
300 First char = \x{212ab}
303 /-- This one is here not because it's different to Perl, but because the way
304 the captured single-byte is displayed. (In Perl it becomes a character, and you
305 can't tell the difference.) --/
317 /-- This one is here because Perl gives out a grumbly error message (quite
318 correctly, but that messes up comparisons). --/
327 ------------------------------------------------------------------
329 [\x00-`c-\xbf\xf1-\xff] (neg)
332 ------------------------------------------------------------------
333 Capturing subpattern count = 0
337 Subject length lower bound = 1
338 Starting byte set: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a
339 \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19
340 \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4
341 5 6 7 8 9 : ; < = > ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y
342 Z [ \ ] ^ _ ` c d e f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f
343 \x80 \x81 \x82 \x83 \x84 \x85 \x86 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e
344 \x8f \x90 \x91 \x92 \x93 \x94 \x95 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d
345 \x9e \x9f \xa0 \xa1 \xa2 \xa3 \xa4 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac
346 \xad \xae \xaf \xb0 \xb1 \xb2 \xb3 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb
347 \xbc \xbd \xbe \xbf \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb
365 ------------------------------------------------------------------
371 ------------------------------------------------------------------
372 Capturing subpattern count = 0
376 Subject length lower bound = 3
377 No set of starting bytes
378 \x{100}\x{100}\x{100}\x{100\x{100}
379 0: \x{100}\x{100}\x{100}
382 ------------------------------------------------------------------
391 ------------------------------------------------------------------
392 Capturing subpattern count = 1
396 Subject length lower bound = 1
397 Starting byte set: x \xff
400 ------------------------------------------------------------------
410 ------------------------------------------------------------------
411 Capturing subpattern count = 1
415 Subject length lower bound = 1
416 Starting byte set: a x \xff
418 /(\x{100}{0,2}a|x)/8SDZ
419 ------------------------------------------------------------------
429 ------------------------------------------------------------------
430 Capturing subpattern count = 1
434 Subject length lower bound = 1
435 Starting byte set: a x \xff
437 /(\x{100}{1,2}a|x)/8SDZ
438 ------------------------------------------------------------------
449 ------------------------------------------------------------------
450 Capturing subpattern count = 1
454 Subject length lower bound = 1
455 Starting byte set: x \xff
458 ------------------------------------------------------------------
463 ------------------------------------------------------------------
464 Capturing subpattern count = 0
469 /a\x{100}\x{101}*/8DZ
470 ------------------------------------------------------------------
476 ------------------------------------------------------------------
477 Capturing subpattern count = 0
482 /a\x{100}\x{101}+/8DZ
483 ------------------------------------------------------------------
489 ------------------------------------------------------------------
490 Capturing subpattern count = 0
496 ------------------------------------------------------------------
501 ------------------------------------------------------------------
502 Capturing subpattern count = 0
508 ------------------------------------------------------------------
513 ------------------------------------------------------------------
514 Capturing subpattern count = 0
528 ------------------------------------------------------------------
533 ------------------------------------------------------------------
534 Capturing subpattern count = 0
542 ------------------------------------------------------------------
547 ------------------------------------------------------------------
548 Capturing subpattern count = 0
553 /\x{100}abc(xyz(?1))/8DZ
554 ------------------------------------------------------------------
563 ------------------------------------------------------------------
564 Capturing subpattern count = 1
570 Capturing subpattern count = 0
580 ------------------------------------------------------------------
586 ------------------------------------------------------------------
587 Capturing subpattern count = 0
593 ------------------------------------------------------------------
599 ------------------------------------------------------------------
600 Capturing subpattern count = 0
606 Failed: missing terminating ] for character class at offset 13
609 \x{0}\x{d7ff}\x{e000}\x{10ffff}
610 Error -10 (bad UTF-32 string) offset=3 reason=2
612 Error -10 (bad UTF-32 string) offset=0 reason=1
616 Error -10 (bad UTF-32 string) offset=0 reason=1
620 Error -10 (bad UTF-32 string) offset=0 reason=1
624 Error -10 (bad UTF-32 string) offset=0 reason=1
628 Error -10 (bad UTF-32 string) offset=0 reason=1
632 Error -10 (bad UTF-32 string) offset=0 reason=3
634 Error -10 (bad UTF-32 string) offset=0 reason=1
636 Error -10 (bad UTF-32 string) offset=0 reason=2
639 Failed: (*VERB) not recognized at offset 5
642 Capturing subpattern count = 0
644 First char = \x{11234}
650 Failed: (*VERB) not recognized at offset 5
652 /(*CRLF)(*UTF16)(*BSR_UNICODE)a\Rb/I
653 Failed: (*VERB) not recognized at offset 12
655 /(*CRLF)(*UTF32)(*BSR_UNICODE)a\Rb/I
656 Capturing subpattern count = 0
657 Options: bsr_unicode utf
658 Forced newline sequence: CRLF
663 Capturing subpattern count = 0
667 Subject length lower bound = 1
668 Starting byte set: \x09 \x20 \xa0 \xff
689 Capturing subpattern count = 0
693 Subject length lower bound = 1
694 Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff
709 Capturing subpattern count = 0
713 Subject length lower bound = 1
714 Starting byte set: \x09 \x20 A \xa0 \xff
721 Capturing subpattern count = 0
725 Subject length lower bound = 1
726 Starting byte set: \x0a \x0b \x0c \x0d A \x85 \xff
733 Capturing subpattern count = 0
737 Subject length lower bound = 2
738 Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff
741 Capturing subpattern count = 0
745 Subject length lower bound = 4
746 Starting byte set: \x09 \x0a \x0c \x0d \x20 x
749 Capturing subpattern count = 0
753 Subject length lower bound = 5
754 Starting byte set: \x09 \x0a \x0c \x0d \x20 \x85 \xa0
761 Capturing subpattern count = 0
765 Subject length lower bound = 3
766 Starting byte set: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x0b \x0e
767 \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 \x1a \x1b \x1c \x1d
768 \x1e \x1f ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 5 6 7 8 9 : ; < = > ? @
769 A B C D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c d e
770 f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f \x80 \x81 \x82 \x83
771 \x84 \x86 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e \x8f \x90 \x91 \x92 \x93
772 \x94 \x95 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d \x9e \x9f \xa1 \xa2 \xa3
773 \xa4 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac \xad \xae \xaf \xb0 \xb1 \xb2
774 \xb3 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb \xbc \xbd \xbe \xbf \xc0 \xc1
775 \xc2 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0
776 \xd1 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf
777 \xe0 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee
778 \xef \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd
795 Error -24 (bad offset value)
797 Error -24 (bad offset value)
800 Capturing subpattern count = 0
801 Options: caseless utf
802 First char = \x{1234}
804 Subject length lower bound = 1
805 No set of starting bytes
808 Capturing subpattern count = 0
809 Options: caseless utf
810 First char = \x{1234}
812 Subject length lower bound = 1
813 No set of starting bytes
816 Capturing subpattern count = 0
817 Options: caseless utf
818 First char = \x{1234}
820 Subject length lower bound = 1
821 No set of starting bytes
824 Capturing subpattern count = 0
825 Options: caseless utf
826 First char = \x{1234}
828 Subject length lower bound = 2
829 No set of starting bytes
832 ------------------------------------------------------------------
837 ------------------------------------------------------------------
838 Capturing subpattern count = 0
844 ------------------------------------------------------------------
850 ------------------------------------------------------------------
851 Capturing subpattern count = 0
857 Capturing subpattern count = 0
861 Subject length lower bound = 1
862 Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff
864 /-- Check bad offset --/
876 Error -24 (bad offset value)
878 Error -24 (bad offset value)
881 **Failed: character value is ill-formed UTF-32
884 ------------------------------------------------------------------
890 ------------------------------------------------------------------
895 ------------------------------------------------------------------
901 ------------------------------------------------------------------
906 ------------------------------------------------------------------
912 ------------------------------------------------------------------
917 ------------------------------------------------------------------
923 ------------------------------------------------------------------
928 ------------------------------------------------------------------
934 ------------------------------------------------------------------
939 ------------------------------------------------------------------
945 ------------------------------------------------------------------
950 ------------------------------------------------------------------
957 ------------------------------------------------------------------
962 ------------------------------------------------------------------
969 ------------------------------------------------------------------
974 ------------------------------------------------------------------
980 ------------------------------------------------------------------
985 ------------------------------------------------------------------
991 ------------------------------------------------------------------
996 ------------------------------------------------------------------
1003 ------------------------------------------------------------------
1008 ------------------------------------------------------------------
1015 ------------------------------------------------------------------
1019 /-- End of testinput18 --/