1 /-- This set of tests is for UTF-16 and UTF-32 support, and is relevant only to
2 the 16- and 32-bit libraries. --/
7 **Failed: invalid UTF-8 string cannot be converted to UTF-32
11 **Failed: invalid UTF-8 string cannot be used as input in UTF mode
45 0: X\x{11234}\x{512}YZ
46 X\x{11234}\x{512}\x{11234}Z
47 0: X\x{11234}\x{512}\x{11234}Z
73 0: a\x{12257}\x{11234}b
83 /-- Check maximum character size --/
86 ------------------------------------------------------------------
91 ------------------------------------------------------------------
92 Capturing subpattern count = 0
98 ------------------------------------------------------------------
103 ------------------------------------------------------------------
104 Capturing subpattern count = 0
106 First char = \x{10000}
110 ------------------------------------------------------------------
115 ------------------------------------------------------------------
116 Capturing subpattern count = 0
122 ------------------------------------------------------------------
127 ------------------------------------------------------------------
128 Capturing subpattern count = 0
130 First char = \x{1000}
134 ------------------------------------------------------------------
139 ------------------------------------------------------------------
140 Capturing subpattern count = 0
142 First char = \x{10000}
146 ------------------------------------------------------------------
151 ------------------------------------------------------------------
152 Capturing subpattern count = 0
154 First char = \x{100000}
158 ------------------------------------------------------------------
163 ------------------------------------------------------------------
164 Capturing subpattern count = 0
166 First char = \x{10ffff}
170 ------------------------------------------------------------------
175 ------------------------------------------------------------------
176 Capturing subpattern count = 0
182 ------------------------------------------------------------------
187 ------------------------------------------------------------------
188 Capturing subpattern count = 0
194 ------------------------------------------------------------------
199 ------------------------------------------------------------------
200 Capturing subpattern count = 0
206 ------------------------------------------------------------------
211 ------------------------------------------------------------------
212 Capturing subpattern count = 0
217 /\x{D55c}\x{ad6d}\x{C5B4}/DZ8
218 ------------------------------------------------------------------
220 \x{d55c}\x{ad6d}\x{c5b4}
223 ------------------------------------------------------------------
224 Capturing subpattern count = 0
226 First char = \x{d55c}
228 \x{D55c}\x{ad6d}\x{C5B4}
229 0: \x{d55c}\x{ad6d}\x{c5b4}
231 /\x{65e5}\x{672c}\x{8a9e}/DZ8
232 ------------------------------------------------------------------
234 \x{65e5}\x{672c}\x{8a9e}
237 ------------------------------------------------------------------
238 Capturing subpattern count = 0
240 First char = \x{65e5}
242 \x{65e5}\x{672c}\x{8a9e}
243 0: \x{65e5}\x{672c}\x{8a9e}
246 ------------------------------------------------------------------
251 ------------------------------------------------------------------
252 Capturing subpattern count = 0
258 ------------------------------------------------------------------
263 ------------------------------------------------------------------
264 Capturing subpattern count = 0
270 ------------------------------------------------------------------
275 ------------------------------------------------------------------
276 Capturing subpattern count = 0
282 ------------------------------------------------------------------
287 ------------------------------------------------------------------
288 Capturing subpattern count = 0
294 ------------------------------------------------------------------
299 ------------------------------------------------------------------
300 Capturing subpattern count = 0
302 First char = \x{212ab}
305 /-- This one is here not because it's different to Perl, but because the way
306 the captured single-byte is displayed. (In Perl it becomes a character, and you
307 can't tell the difference.) --/
319 /-- This one is here because Perl gives out a grumbly error message (quite
320 correctly, but that messes up comparisons). --/
329 ------------------------------------------------------------------
331 [\x00-`c-\xbf\xf1-\xff] (neg)
334 ------------------------------------------------------------------
335 Capturing subpattern count = 0
339 Subject length lower bound = 1
340 Starting chars: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a
341 \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19
342 \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4
343 5 6 7 8 9 : ; < = > ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y
344 Z [ \ ] ^ _ ` c d e f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f
345 \x80 \x81 \x82 \x83 \x84 \x85 \x86 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e
346 \x8f \x90 \x91 \x92 \x93 \x94 \x95 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d
347 \x9e \x9f \xa0 \xa1 \xa2 \xa3 \xa4 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac
348 \xad \xae \xaf \xb0 \xb1 \xb2 \xb3 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb
349 \xbc \xbd \xbe \xbf \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb
367 ------------------------------------------------------------------
373 ------------------------------------------------------------------
374 Capturing subpattern count = 0
378 Subject length lower bound = 3
379 No starting char list
380 \x{100}\x{100}\x{100}\x{100\x{100}
381 0: \x{100}\x{100}\x{100}
384 ------------------------------------------------------------------
393 ------------------------------------------------------------------
394 Capturing subpattern count = 1
398 Subject length lower bound = 1
399 Starting chars: x \xff
402 ------------------------------------------------------------------
412 ------------------------------------------------------------------
413 Capturing subpattern count = 1
417 Subject length lower bound = 1
418 Starting chars: a x \xff
420 /(\x{100}{0,2}a|x)/8SDZ
421 ------------------------------------------------------------------
431 ------------------------------------------------------------------
432 Capturing subpattern count = 1
436 Subject length lower bound = 1
437 Starting chars: a x \xff
439 /(\x{100}{1,2}a|x)/8SDZ
440 ------------------------------------------------------------------
451 ------------------------------------------------------------------
452 Capturing subpattern count = 1
456 Subject length lower bound = 1
457 Starting chars: x \xff
460 ------------------------------------------------------------------
465 ------------------------------------------------------------------
466 Capturing subpattern count = 0
471 /a\x{100}\x{101}*/8DZ
472 ------------------------------------------------------------------
478 ------------------------------------------------------------------
479 Capturing subpattern count = 0
484 /a\x{100}\x{101}+/8DZ
485 ------------------------------------------------------------------
491 ------------------------------------------------------------------
492 Capturing subpattern count = 0
498 ------------------------------------------------------------------
503 ------------------------------------------------------------------
504 Capturing subpattern count = 0
510 ------------------------------------------------------------------
515 ------------------------------------------------------------------
516 Capturing subpattern count = 0
530 ------------------------------------------------------------------
535 ------------------------------------------------------------------
536 Capturing subpattern count = 0
544 ------------------------------------------------------------------
549 ------------------------------------------------------------------
550 Capturing subpattern count = 0
555 /\x{100}abc(xyz(?1))/8DZ
556 ------------------------------------------------------------------
565 ------------------------------------------------------------------
566 Capturing subpattern count = 1
572 Capturing subpattern count = 0
582 ------------------------------------------------------------------
588 ------------------------------------------------------------------
589 Capturing subpattern count = 0
595 ------------------------------------------------------------------
601 ------------------------------------------------------------------
602 Capturing subpattern count = 0
608 Failed: missing terminating ] for character class at offset 13
612 Error -10 (bad UTF-32 string) offset=0 reason=1
616 Error -10 (bad UTF-32 string) offset=0 reason=1
620 Error -10 (bad UTF-32 string) offset=0 reason=1
624 Error -10 (bad UTF-32 string) offset=0 reason=1
628 Error -10 (bad UTF-32 string) offset=0 reason=1
632 Error -10 (bad UTF-32 string) offset=0 reason=3
634 Error -10 (bad UTF-32 string) offset=0 reason=1
637 Failed: (*VERB) not recognized or malformed at offset 5
640 Capturing subpattern count = 0
642 First char = \x{11234}
648 Failed: (*VERB) not recognized or malformed at offset 5
650 /(*CRLF)(*UTF16)(*BSR_UNICODE)a\Rb/I
651 Failed: (*VERB) not recognized or malformed at offset 12
653 /(*CRLF)(*UTF32)(*BSR_UNICODE)a\Rb/I
654 Capturing subpattern count = 0
655 Options: bsr_unicode utf
656 Forced newline sequence: CRLF
661 Capturing subpattern count = 0
665 Subject length lower bound = 1
666 Starting chars: \x09 \x20 \xa0 \xff
687 Capturing subpattern count = 0
691 Subject length lower bound = 1
692 Starting chars: \x0a \x0b \x0c \x0d \x85 \xff
707 Capturing subpattern count = 0
711 Subject length lower bound = 1
712 Starting chars: \x09 \x20 A \xa0 \xff
718 /\R*A/SI8<bsr_unicode>
719 Capturing subpattern count = 0
720 Options: bsr_unicode utf
723 Subject length lower bound = 1
724 Starting chars: \x0a \x0b \x0c \x0d A \x85 \xff
731 Capturing subpattern count = 0
735 Subject length lower bound = 2
736 Starting chars: \x0a \x0b \x0c \x0d \x85 \xff
739 Capturing subpattern count = 0
743 Subject length lower bound = 4
744 Starting chars: \x09 \x0a \x0b \x0c \x0d \x20 x
747 Capturing subpattern count = 0
751 Subject length lower bound = 5
752 Starting chars: \x09 \x0a \x0b \x0c \x0d \x20 \x85 \xa0
759 Capturing subpattern count = 0
763 Subject length lower bound = 3
764 Starting chars: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x0e \x0f
765 \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 \x1a \x1b \x1c \x1d \x1e
766 \x1f ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 5 6 7 8 9 : ; < = > ? @ A B C
767 D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c d e f g h
768 i j k l m n o p q r s t u v w x y z { | } ~ \x7f \x80 \x81 \x82 \x83 \x84
769 \x86 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e \x8f \x90 \x91 \x92 \x93 \x94
770 \x95 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d \x9e \x9f \xa1 \xa2 \xa3 \xa4
771 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac \xad \xae \xaf \xb0 \xb1 \xb2 \xb3
772 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb \xbc \xbd \xbe \xbf \xc0 \xc1 \xc2
773 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1
774 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0
775 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee \xef
776 \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe
793 Error -24 (bad offset value)
795 Error -24 (bad offset value)
798 Capturing subpattern count = 0
799 Options: caseless utf
800 First char = \x{1234}
802 Subject length lower bound = 1
803 No starting char list
806 Capturing subpattern count = 0
807 Options: caseless utf
808 First char = \x{1234}
810 Subject length lower bound = 1
811 No starting char list
814 Capturing subpattern count = 0
815 Options: caseless utf
816 First char = \x{1234}
818 Subject length lower bound = 1
819 No starting char list
822 Capturing subpattern count = 0
823 Options: caseless utf
824 First char = \x{1234}
826 Subject length lower bound = 2
827 No starting char list
830 ------------------------------------------------------------------
835 ------------------------------------------------------------------
836 Capturing subpattern count = 0
842 ------------------------------------------------------------------
848 ------------------------------------------------------------------
849 Capturing subpattern count = 0
855 Capturing subpattern count = 0
859 Subject length lower bound = 1
860 Starting chars: \x0a \x0b \x0c \x0d \x85 \xff
862 /-- Check bad offset --/
874 Error -24 (bad offset value)
876 Error -24 (bad offset value)
879 **Failed: character value is ill-formed UTF-32
882 ------------------------------------------------------------------
888 ------------------------------------------------------------------
893 ------------------------------------------------------------------
899 ------------------------------------------------------------------
904 ------------------------------------------------------------------
910 ------------------------------------------------------------------
915 ------------------------------------------------------------------
921 ------------------------------------------------------------------
926 ------------------------------------------------------------------
932 ------------------------------------------------------------------
937 ------------------------------------------------------------------
943 ------------------------------------------------------------------
948 ------------------------------------------------------------------
955 ------------------------------------------------------------------
960 ------------------------------------------------------------------
967 ------------------------------------------------------------------
972 ------------------------------------------------------------------
978 ------------------------------------------------------------------
983 ------------------------------------------------------------------
989 ------------------------------------------------------------------
994 ------------------------------------------------------------------
1001 ------------------------------------------------------------------
1006 ------------------------------------------------------------------
1013 ------------------------------------------------------------------
1018 Failed: setting UTF is disabled by the application at offset 0
1021 Failed: setting UTF is disabled by the application at offset 0
1023 /-- End of testinput18 --/