1 # This set of tests is for UTF-16 and UTF-32 support, including Unicode
2 # properties. It is relevant only to the 16-bit and 32-bit libraries. The
3 # output is different for each library, so there are separate output files.
5 /ÃÃÃxxx/IB,utf,no_utf_check
6 ** Failed: invalid UTF-8 string cannot be converted to 32-bit string
10 ** Failed: invalid UTF-8 string cannot be used as input in UTF mode
12 # Check maximum character size
15 ------------------------------------------------------------------
20 ------------------------------------------------------------------
21 Capturing subpattern count = 0
23 First code unit = \x{ffff}
24 Subject length lower bound = 1
27 ------------------------------------------------------------------
32 ------------------------------------------------------------------
33 Capturing subpattern count = 0
35 First code unit = \x{10000}
36 Subject length lower bound = 1
39 ------------------------------------------------------------------
44 ------------------------------------------------------------------
45 Capturing subpattern count = 0
47 First code unit = \x{100}
48 Subject length lower bound = 1
51 ------------------------------------------------------------------
56 ------------------------------------------------------------------
57 Capturing subpattern count = 0
59 First code unit = \x{1000}
60 Subject length lower bound = 1
63 ------------------------------------------------------------------
68 ------------------------------------------------------------------
69 Capturing subpattern count = 0
71 First code unit = \x{10000}
72 Subject length lower bound = 1
75 ------------------------------------------------------------------
80 ------------------------------------------------------------------
81 Capturing subpattern count = 0
83 First code unit = \x{100000}
84 Subject length lower bound = 1
87 ------------------------------------------------------------------
92 ------------------------------------------------------------------
93 Capturing subpattern count = 0
95 First code unit = \x{10ffff}
96 Subject length lower bound = 1
99 ------------------------------------------------------------------
104 ------------------------------------------------------------------
105 Capturing subpattern count = 0
107 First code unit = \xff
108 Subject length lower bound = 1
111 ------------------------------------------------------------------
116 ------------------------------------------------------------------
117 Capturing subpattern count = 0
119 First code unit = \x{100}
120 Subject length lower bound = 1
123 ------------------------------------------------------------------
128 ------------------------------------------------------------------
129 Capturing subpattern count = 0
131 First code unit = \x80
132 Subject length lower bound = 1
135 ------------------------------------------------------------------
140 ------------------------------------------------------------------
141 Capturing subpattern count = 0
143 First code unit = \xff
144 Subject length lower bound = 1
146 /\x{D55c}\x{ad6d}\x{C5B4}/IB,utf
147 ------------------------------------------------------------------
149 \x{d55c}\x{ad6d}\x{c5b4}
152 ------------------------------------------------------------------
153 Capturing subpattern count = 0
155 First code unit = \x{d55c}
156 Last code unit = \x{c5b4}
157 Subject length lower bound = 3
158 \x{D55c}\x{ad6d}\x{C5B4}
159 0: \x{d55c}\x{ad6d}\x{c5b4}
161 /\x{65e5}\x{672c}\x{8a9e}/IB,utf
162 ------------------------------------------------------------------
164 \x{65e5}\x{672c}\x{8a9e}
167 ------------------------------------------------------------------
168 Capturing subpattern count = 0
170 First code unit = \x{65e5}
171 Last code unit = \x{8a9e}
172 Subject length lower bound = 3
173 \x{65e5}\x{672c}\x{8a9e}
174 0: \x{65e5}\x{672c}\x{8a9e}
177 ------------------------------------------------------------------
182 ------------------------------------------------------------------
183 Capturing subpattern count = 0
185 First code unit = \x80
186 Subject length lower bound = 1
189 ------------------------------------------------------------------
194 ------------------------------------------------------------------
195 Capturing subpattern count = 0
197 First code unit = \x84
198 Subject length lower bound = 1
201 ------------------------------------------------------------------
206 ------------------------------------------------------------------
207 Capturing subpattern count = 0
209 First code unit = \x{104}
210 Subject length lower bound = 1
213 ------------------------------------------------------------------
218 ------------------------------------------------------------------
219 Capturing subpattern count = 0
221 First code unit = \x{861}
222 Subject length lower bound = 1
225 ------------------------------------------------------------------
230 ------------------------------------------------------------------
231 Capturing subpattern count = 0
233 First code unit = \x{212ab}
234 Subject length lower bound = 1
236 /[^ab\xC0-\xF0]/IB,utf
237 ------------------------------------------------------------------
239 [\x00-`c-\xbf\xf1-\xff] (neg)
242 ------------------------------------------------------------------
243 Capturing subpattern count = 0
245 Starting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a
246 \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19
247 \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4
248 5 6 7 8 9 : ; < = > ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y
249 Z [ \ ] ^ _ ` c d e f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f
250 \x80 \x81 \x82 \x83 \x84 \x85 \x86 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e
251 \x8f \x90 \x91 \x92 \x93 \x94 \x95 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d
252 \x9e \x9f \xa0 \xa1 \xa2 \xa3 \xa4 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac
253 \xad \xae \xaf \xb0 \xb1 \xb2 \xb3 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb
254 \xbc \xbd \xbe \xbf \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb
256 Subject length lower bound = 1
272 ------------------------------------------------------------------
278 ------------------------------------------------------------------
279 Capturing subpattern count = 0
281 First code unit = \x{100}
282 Last code unit = \x{100}
283 Subject length lower bound = 3
284 \x{100}\x{100}\x{100}\x{100\x{100}
285 0: \x{100}\x{100}\x{100}
288 ------------------------------------------------------------------
297 ------------------------------------------------------------------
298 Capturing subpattern count = 1
300 Starting code units: x \xff
301 Subject length lower bound = 1
303 /(\x{100}*a|x)/IB,utf
304 ------------------------------------------------------------------
314 ------------------------------------------------------------------
315 Capturing subpattern count = 1
317 Starting code units: a x \xff
318 Subject length lower bound = 1
320 /(\x{100}{0,2}a|x)/IB,utf
321 ------------------------------------------------------------------
331 ------------------------------------------------------------------
332 Capturing subpattern count = 1
334 Starting code units: a x \xff
335 Subject length lower bound = 1
337 /(\x{100}{1,2}a|x)/IB,utf
338 ------------------------------------------------------------------
349 ------------------------------------------------------------------
350 Capturing subpattern count = 1
352 Starting code units: x \xff
353 Subject length lower bound = 1
356 ------------------------------------------------------------------
361 ------------------------------------------------------------------
362 Capturing subpattern count = 0
364 First code unit = \x{100}
365 Subject length lower bound = 1
367 /a\x{100}\x{101}*/IB,utf
368 ------------------------------------------------------------------
374 ------------------------------------------------------------------
375 Capturing subpattern count = 0
377 First code unit = 'a'
378 Last code unit = \x{100}
379 Subject length lower bound = 2
381 /a\x{100}\x{101}+/IB,utf
382 ------------------------------------------------------------------
388 ------------------------------------------------------------------
389 Capturing subpattern count = 0
391 First code unit = 'a'
392 Last code unit = \x{101}
393 Subject length lower bound = 3
396 ------------------------------------------------------------------
401 ------------------------------------------------------------------
402 Capturing subpattern count = 0
403 Subject length lower bound = 1
406 ------------------------------------------------------------------
411 ------------------------------------------------------------------
412 Capturing subpattern count = 0
414 First code unit = \x{100}
415 Subject length lower bound = 1
424 ------------------------------------------------------------------
429 ------------------------------------------------------------------
430 Capturing subpattern count = 0
432 First code unit = \xff
433 Subject length lower bound = 1
438 ------------------------------------------------------------------
443 ------------------------------------------------------------------
444 Capturing subpattern count = 0
446 Subject length lower bound = 1
448 /\x{100}abc(xyz(?1))/IB,utf
449 ------------------------------------------------------------------
458 ------------------------------------------------------------------
459 Capturing subpattern count = 1
461 First code unit = \x{100}
463 Subject length lower bound = 7
466 Capturing subpattern count = 0
468 First code unit = \x{1ff}
469 Subject length lower bound = 1
475 /\x{100}+\x{200}/IB,utf
476 ------------------------------------------------------------------
482 ------------------------------------------------------------------
483 Capturing subpattern count = 0
485 First code unit = \x{100}
486 Last code unit = \x{200}
487 Subject length lower bound = 2
490 ------------------------------------------------------------------
496 ------------------------------------------------------------------
497 Capturing subpattern count = 0
499 First code unit = \x{100}
501 Subject length lower bound = 2
504 Failed: error 106 at offset 13: missing terminating ] for character class
507 XX\x{d800}\=no_utf_check
509 XX\x{da00}\=no_utf_check
511 XX\x{dc00}\=no_utf_check
513 XX\x{de00}\=no_utf_check
515 XX\x{dfff}\=no_utf_check
519 Failed: error -27: UTF-32 error: code points 0xd800-0xdfff are not defined at offset 2
521 Failed: error -27: UTF-32 error: code points 0xd800-0xdfff are not defined at offset 2
523 Failed: error -27: UTF-32 error: code points 0xd800-0xdfff are not defined at offset 2
525 Failed: error -27: UTF-32 error: code points 0xd800-0xdfff are not defined at offset 2
527 Failed: error -27: UTF-32 error: code points 0xd800-0xdfff are not defined at offset 2
529 Failed: error -28: UTF-32 error: code points greater than 0x10ffff are not defined at offset 2
531 Failed: error -27: UTF-32 error: code points 0xd800-0xdfff are not defined at offset 2
538 Failed: error -27: UTF-32 error: code points 0xd800-0xdfff are not defined at offset 2
541 Failed: error 160 at offset 5: (*VERB) not recognized or malformed
545 Capturing subpattern count = 0
546 Compile options: <none>
548 First code unit = \x{11234}
549 Subject length lower bound = 1
554 Failed: error 160 at offset 5: (*VERB) not recognized or malformed
558 Failed: error 160 at offset 5: (*VERB) not recognized or malformed
561 /(*CRLF)(*UTF16)(*BSR_UNICODE)a\Rb/I
562 Failed: error 160 at offset 12: (*VERB) not recognized or malformed
564 /(*CRLF)(*UTF32)(*BSR_UNICODE)a\Rb/I
565 Capturing subpattern count = 0
566 Compile options: <none>
568 \R matches any Unicode newline
569 Forced newline is CRLF
570 First code unit = 'a'
572 Subject length lower bound = 3
575 Capturing subpattern count = 0
577 Starting code units: \x09 \x20 \xa0 \xff
578 Subject length lower bound = 1
599 Capturing subpattern count = 0
601 Starting code units: \x0a \x0b \x0c \x0d \x85 \xff
602 Subject length lower bound = 1
617 Capturing subpattern count = 0
619 Starting code units: \x09 \x20 A \xa0 \xff
621 Subject length lower bound = 1
627 /\R*A/I,bsr=unicode,utf
628 Capturing subpattern count = 0
630 \R matches any Unicode newline
631 Starting code units: \x0a \x0b \x0c \x0d A \x85 \xff
633 Subject length lower bound = 1
640 Capturing subpattern count = 0
642 Starting code units: \x0a \x0b \x0c \x0d \x85 \xff
644 Subject length lower bound = 2
647 Capturing subpattern count = 0
649 Starting code units: \x09 \x0a \x0b \x0c \x0d \x20 x
651 Subject length lower bound = 4
653 /\sxxx\s/I,utf,tables=2
654 Capturing subpattern count = 0
656 Starting code units: \x09 \x0a \x0b \x0c \x0d \x20 \x85 \xa0
658 Subject length lower bound = 5
664 /\S \S/I,utf,tables=2
665 Capturing subpattern count = 0
667 Starting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x0e \x0f
668 \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 \x1a \x1b \x1c \x1d \x1e
669 \x1f ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 5 6 7 8 9 : ; < = > ? @ A B C
670 D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c d e f g h
671 i j k l m n o p q r s t u v w x y z { | } ~ \x7f \x80 \x81 \x82 \x83 \x84
672 \x86 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e \x8f \x90 \x91 \x92 \x93 \x94
673 \x95 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d \x9e \x9f \xa1 \xa2 \xa3 \xa4
674 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac \xad \xae \xaf \xb0 \xb1 \xb2 \xb3
675 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb \xbc \xbd \xbe \xbf \xc0 \xc1 \xc2
676 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1
677 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0
678 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee \xef
679 \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe
682 Subject length lower bound = 3
698 \= Expect bad offset error
700 Failed: error -33: bad offset value
702 Failed: error -33: bad offset value
705 Capturing subpattern count = 0
706 Options: caseless utf
707 First code unit = \x{1234}
708 Subject length lower bound = 1
711 Capturing subpattern count = 0
712 Options: caseless utf
713 First code unit = \x{1234}
714 Subject length lower bound = 1
717 Capturing subpattern count = 0
718 Options: caseless utf
719 First code unit = \x{1234}
720 Subject length lower bound = 1
723 Capturing subpattern count = 0
724 Options: caseless utf
725 First code unit = \x{1234}
726 Last code unit = \x{1234}
727 Subject length lower bound = 2
730 ------------------------------------------------------------------
735 ------------------------------------------------------------------
736 Capturing subpattern count = 0
738 Subject length lower bound = 1
741 ------------------------------------------------------------------
747 ------------------------------------------------------------------
748 Capturing subpattern count = 0
750 First code unit = 'X'
751 Last code unit = \x{200}
752 Subject length lower bound = 2
755 Capturing subpattern count = 0
757 Starting code units: \x0a \x0b \x0c \x0d \x85 \xff
758 Subject length lower bound = 1
763 \= Expect bad UTF-16 offset, or no match in 32-bit
766 \x{10000}ab\=offset=1
768 \= Expect 16-bit match, 32-bit no match
769 \x{10000}ab\=offset=2
772 \x{10000}ab\=offset=3
774 \= Expect no match in 16-bit, bad offset in 32-bit
775 \x{10000}ab\=offset=4
776 Failed: error -33: bad offset value
778 \x{10000}ab\=offset=5
779 Failed: error -33: bad offset value
782 Failed: error -27 at offset 0: UTF-32 error: code points 0xd800-0xdfff are not defined
785 ------------------------------------------------------------------
791 ------------------------------------------------------------------
795 /\w+\x{C4}/B,utf,tables=2
796 ------------------------------------------------------------------
802 ------------------------------------------------------------------
807 ------------------------------------------------------------------
813 ------------------------------------------------------------------
817 /\W+\x{C4}/B,utf,tables=2
818 ------------------------------------------------------------------
824 ------------------------------------------------------------------
829 ------------------------------------------------------------------
835 ------------------------------------------------------------------
839 /\W+\x{A1}/B,utf,tables=2
840 ------------------------------------------------------------------
846 ------------------------------------------------------------------
851 ------------------------------------------------------------------
858 ------------------------------------------------------------------
862 /X\s+\x{A0}/B,utf,tables=2
863 ------------------------------------------------------------------
870 ------------------------------------------------------------------
875 ------------------------------------------------------------------
881 ------------------------------------------------------------------
885 /\S+\x{A0}/B,utf,tables=2
886 ------------------------------------------------------------------
892 ------------------------------------------------------------------
897 ------------------------------------------------------------------
904 ------------------------------------------------------------------
908 /\x{a0}+\s!/B,utf,tables=2
909 ------------------------------------------------------------------
916 ------------------------------------------------------------------
921 Failed: error 174 at offset 6: using UTF is disabled by the application
924 Failed: error 174 at offset 0: using UTF is disabled by the application
926 /A\x{391}\x{10427}\x{ff3a}\x{1fb0}/IBi,utf
927 ------------------------------------------------------------------
929 /i A\x{391}\x{10427}\x{ff3a}\x{1fb0}
932 ------------------------------------------------------------------
933 Capturing subpattern count = 0
934 Options: caseless utf
935 First code unit = 'A' (caseless)
936 Last code unit = \x{1fb0} (caseless)
937 Subject length lower bound = 5
939 /A\x{391}\x{10427}\x{ff3a}\x{1fb0}/IB,utf
940 ------------------------------------------------------------------
942 A\x{391}\x{10427}\x{ff3a}\x{1fb0}
945 ------------------------------------------------------------------
946 Capturing subpattern count = 0
948 First code unit = 'A'
949 Last code unit = \x{1fb0}
950 Subject length lower bound = 5
953 ------------------------------------------------------------------
958 ------------------------------------------------------------------
959 Capturing subpattern count = 0
961 First code unit = 'A'
962 Last code unit = \x{1fb0}
963 Subject length lower bound = 3
966 ------------------------------------------------------------------
971 ------------------------------------------------------------------
972 Capturing subpattern count = 0
973 Options: caseless utf
974 First code unit = 'A' (caseless)
975 Last code unit = \x{1fb0} (caseless)
976 Subject length lower bound = 3
978 /\x{401}\x{420}\x{421}\x{422}\x{423}\x{424}\x{425}\x{426}\x{427}\x{428}\x{429}\x{42a}\x{42b}\x{42c}\x{42d}\x{42e}\x{42f}/Ii,utf
979 Capturing subpattern count = 0
980 Options: caseless utf
981 First code unit = \x{401} (caseless)
982 Last code unit = \x{42f} (caseless)
983 Subject length lower bound = 17
984 \x{401}\x{420}\x{421}\x{422}\x{423}\x{424}\x{425}\x{426}\x{427}\x{428}\x{429}\x{42a}\x{42b}\x{42c}\x{42d}\x{42e}\x{42f}
985 0: \x{401}\x{420}\x{421}\x{422}\x{423}\x{424}\x{425}\x{426}\x{427}\x{428}\x{429}\x{42a}\x{42b}\x{42c}\x{42d}\x{42e}\x{42f}
986 \x{451}\x{440}\x{441}\x{442}\x{443}\x{444}\x{445}\x{446}\x{447}\x{448}\x{449}\x{44a}\x{44b}\x{44c}\x{44d}\x{44e}\x{44f}
987 0: \x{451}\x{440}\x{441}\x{442}\x{443}\x{444}\x{445}\x{446}\x{447}\x{448}\x{449}\x{44a}\x{44b}\x{44c}\x{44d}\x{44e}\x{44f}
990 ------------------------------------------------------------------
995 ------------------------------------------------------------------
998 ------------------------------------------------------------------
1003 ------------------------------------------------------------------
1006 ------------------------------------------------------------------
1008 [\x09 \xa0\x{1680}\x{180e}\x{2000}-\x{200a}\x{202f}\x{205f}\x{3000}]
1011 ------------------------------------------------------------------
1014 Capturing subpattern count = 0
1015 Options: caseless utf
1016 Starting code units: K k \xff
1017 Subject length lower bound = 1
1022 Capturing subpattern count = 0
1023 Options: caseless utf
1024 Starting code units: S s \xff
1025 Subject length lower bound = 1
1029 # Non-UTF characters should give errors in both 16-bit and 32-bit modes.
1032 Failed: error 134 at offset 9: character code point value in \x{} or \o{} is too large
1035 Failed: error 134 at offset 10: character code point value in \x{} or \o{} is too large
1038 ------------------------------------------------------------------
1044 ------------------------------------------------------------------
1045 Capturing subpattern count = 0
1047 Starting code units: A \xff
1048 Last code unit = 'A'
1049 Subject length lower bound = 1
1053 /\x{100}*\d(?R)/IB,utf
1054 ------------------------------------------------------------------
1061 ------------------------------------------------------------------
1062 Capturing subpattern count = 0
1064 Starting code units: 0 1 2 3 4 5 6 7 8 9 \xff
1065 Subject length lower bound = 1
1068 ------------------------------------------------------------------
1073 ------------------------------------------------------------------
1074 Capturing subpattern count = 0
1076 Starting code units: Z \xff
1077 Subject length lower bound = 1
1086 ------------------------------------------------------------------
1091 ------------------------------------------------------------------
1092 Capturing subpattern count = 0
1094 Starting code units: z { | } ~ \x7f \x80 \x81 \x82 \x83 \x84 \x85 \x86 \x87
1095 \x88 \x89 \x8a \x8b \x8c \x8d \x8e \x8f \x90 \x91 \x92 \x93 \x94 \x95 \x96
1096 \x97 \x98 \x99 \x9a \x9b \x9c \x9d \x9e \x9f \xa0 \xa1 \xa2 \xa3 \xa4 \xa5
1097 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac \xad \xae \xaf \xb0 \xb1 \xb2 \xb3 \xb4
1098 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb \xbc \xbd \xbe \xbf \xc0 \xc1 \xc2 \xc3
1099 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1 \xd2
1100 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0 \xe1
1101 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee \xef \xf0
1102 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe \xff
1103 Subject length lower bound = 1
1105 /[z\Qa-d]Ā\E]/IB,utf
1106 ------------------------------------------------------------------
1111 ------------------------------------------------------------------
1112 Capturing subpattern count = 0
1114 Starting code units: - ] a d z \xff
1115 Subject length lower bound = 1
1121 /[ab\x{100}]abc(xyz(?1))/IB,utf
1122 ------------------------------------------------------------------
1132 ------------------------------------------------------------------
1133 Capturing subpattern count = 1
1135 Starting code units: a b \xff
1136 Last code unit = 'z'
1137 Subject length lower bound = 7
1140 ------------------------------------------------------------------
1146 ------------------------------------------------------------------
1147 Capturing subpattern count = 0
1149 Starting code units: \x09 \x0a \x0b \x0c \x0d \x20 \xff
1150 Subject length lower bound = 1
1153 ------------------------------------------------------------------
1159 ------------------------------------------------------------------
1160 Capturing subpattern count = 0
1162 Starting code units: 0 1 2 3 4 5 6 7 8 9 \xff
1163 Subject length lower bound = 1
1166 ------------------------------------------------------------------
1172 ------------------------------------------------------------------
1173 Capturing subpattern count = 0
1175 Starting code units: 0 1 2 3 4 5 6 7 8 9 A B C D E F G H I J K L M N O P
1176 Q R S T U V W X Y Z _ a b c d e f g h i j k l m n o p q r s t u v w x y z
1178 Subject length lower bound = 1
1181 ------------------------------------------------------------------
1187 ------------------------------------------------------------------
1188 Capturing subpattern count = 0
1190 Starting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a
1191 \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19
1192 \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / : ; < = >
1193 ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c
1194 d e f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f \x80 \x81 \x82
1195 \x83 \x84 \x85 \x86 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e \x8f \x90 \x91
1196 \x92 \x93 \x94 \x95 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d \x9e \x9f \xa0
1197 \xa1 \xa2 \xa3 \xa4 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac \xad \xae \xaf
1198 \xb0 \xb1 \xb2 \xb3 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb \xbc \xbd \xbe
1199 \xbf \xc0 \xc1 \xc2 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd
1200 \xce \xcf \xd0 \xd1 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc
1201 \xdd \xde \xdf \xe0 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb
1202 \xec \xed \xee \xef \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa
1203 \xfb \xfc \xfd \xfe \xff
1204 Subject length lower bound = 1
1207 ------------------------------------------------------------------
1213 ------------------------------------------------------------------
1214 Capturing subpattern count = 0
1216 Starting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x0e \x0f
1217 \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 \x1a \x1b \x1c \x1d \x1e
1218 \x1f ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 5 6 7 8 9 : ; < = > ? @ A B C
1219 D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c d e f g h
1220 i j k l m n o p q r s t u v w x y z { | } ~ \x7f \x80 \x81 \x82 \x83 \x84
1221 \x85 \x86 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e \x8f \x90 \x91 \x92 \x93
1222 \x94 \x95 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d \x9e \x9f \xa0 \xa1 \xa2
1223 \xa3 \xa4 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac \xad \xae \xaf \xb0 \xb1
1224 \xb2 \xb3 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb \xbc \xbd \xbe \xbf \xc0
1225 \xc1 \xc2 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf
1226 \xd0 \xd1 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde
1227 \xdf \xe0 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed
1228 \xee \xef \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc
1230 Subject length lower bound = 1
1233 ------------------------------------------------------------------
1239 ------------------------------------------------------------------
1240 Capturing subpattern count = 0
1242 Starting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a
1243 \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19
1244 \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / : ; < = >
1245 ? @ [ \ ] ^ ` { | } ~ \x7f \x80 \x81 \x82 \x83 \x84 \x85 \x86 \x87 \x88 \x89
1246 \x8a \x8b \x8c \x8d \x8e \x8f \x90 \x91 \x92 \x93 \x94 \x95 \x96 \x97 \x98
1247 \x99 \x9a \x9b \x9c \x9d \x9e \x9f \xa0 \xa1 \xa2 \xa3 \xa4 \xa5 \xa6 \xa7
1248 \xa8 \xa9 \xaa \xab \xac \xad \xae \xaf \xb0 \xb1 \xb2 \xb3 \xb4 \xb5 \xb6
1249 \xb7 \xb8 \xb9 \xba \xbb \xbc \xbd \xbe \xbf \xc0 \xc1 \xc2 \xc3 \xc4 \xc5
1250 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1 \xd2 \xd3 \xd4
1251 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0 \xe1 \xe2 \xe3
1252 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee \xef \xf0 \xf1 \xf2
1253 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe \xff
1254 Subject length lower bound = 1
1256 /[\x{105}-\x{109}]/IBi,utf
1257 ------------------------------------------------------------------
1262 ------------------------------------------------------------------
1263 Capturing subpattern count = 0
1264 Options: caseless utf
1265 Starting code units: \xff
1266 Subject length lower bound = 1
1279 /[z-\x{100}]/IBi,utf
1280 ------------------------------------------------------------------
1282 [Zz-\xff\x{39c}\x{3bc}\x{212b}\x{1e9e}\x{212b}\x{178}\x{100}-\x{101}]
1285 ------------------------------------------------------------------
1286 Capturing subpattern count = 0
1287 Options: caseless utf
1288 Starting code units: Z z { | } ~ \x7f \x80 \x81 \x82 \x83 \x84 \x85 \x86
1289 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e \x8f \x90 \x91 \x92 \x93 \x94 \x95
1290 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d \x9e \x9f \xa0 \xa1 \xa2 \xa3 \xa4
1291 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac \xad \xae \xaf \xb0 \xb1 \xb2 \xb3
1292 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb \xbc \xbd \xbe \xbf \xc0 \xc1 \xc2
1293 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1
1294 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0
1295 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee \xef
1296 \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe
1298 Subject length lower bound = 1
1325 /[z-\x{100}]/IBi,utf
1326 ------------------------------------------------------------------
1328 [Zz-\xff\x{39c}\x{3bc}\x{212b}\x{1e9e}\x{212b}\x{178}\x{100}-\x{101}]
1331 ------------------------------------------------------------------
1332 Capturing subpattern count = 0
1333 Options: caseless utf
1334 Starting code units: Z z { | } ~ \x7f \x80 \x81 \x82 \x83 \x84 \x85 \x86
1335 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e \x8f \x90 \x91 \x92 \x93 \x94 \x95
1336 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d \x9e \x9f \xa0 \xa1 \xa2 \xa3 \xa4
1337 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac \xad \xae \xaf \xb0 \xb1 \xb2 \xb3
1338 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb \xbc \xbd \xbe \xbf \xc0 \xc1 \xc2
1339 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1
1340 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0
1341 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee \xef
1342 \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe
1344 Subject length lower bound = 1
1347 ------------------------------------------------------------------
1349 clist 03a3 03c2 03c3
1353 ------------------------------------------------------------------
1354 Capturing subpattern count = 0
1355 Options: caseless utf
1356 Starting code units: \xff
1357 Last code unit = 'B' (caseless)
1358 Subject length lower bound = 2
1362 Failed: error -28: UTF-32 error: code points greater than 0x10ffff are not defined at offset 0
1365 ------------------------------------------------------------------
1367 ab\x{fd}\x{bf}\x{bf}\x{bf}\x{bf}\x{bf}z
1370 ------------------------------------------------------------------
1373 ** Failed: character value greater than 0x10ffff cannot be converted to UTF
1376 ------------------------------------------------------------------
1378 [\x00-/:-@[-^`{-\xff\p{Any}\x{100}-\x{ffffffff}]
1381 ------------------------------------------------------------------
1388 ------------------------------------------------------------------
1390 [\x00-/:-@[-^`{-\xff\p{L}\x{100}-\x{ffffffff}]
1393 ------------------------------------------------------------------
1404 /[\s[:^ascii:]]/B,ucp
1405 ------------------------------------------------------------------
1407 [\x80-\xff\p{Xsp}\x{100}-\x{ffffffff}]
1410 ------------------------------------------------------------------
1416 # A special extra option allows escaped surrogate code points in 32-bit mode,
1417 # but subjects containing them must not be UTF-checked. These patterns give
1418 # errors in 16-bit mode.
1420 /\x{d800}/I,utf,allow_surrogate_escapes
1421 Capturing subpattern count = 0
1423 Extra options: allow_surrogate_escapes
1424 First code unit = \x{d800}
1425 Subject length lower bound = 1
1426 \x{d800}\=no_utf_check
1429 /\udfff\o{157401}/utf,alt_bsux,allow_surrogate_escapes
1430 \x{dfff}\x{df01}\=no_utf_check
1433 # This has different starting code units in 8-bit mode.
1436 ------------------------------------------------------------------
1439 [\x00-`c-\xff] (neg)
1442 ------------------------------------------------------------------
1443 Capturing subpattern count = 0
1444 Compile options: utf
1445 Overall options: anchored utf
1446 Starting code units: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a
1447 \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19
1448 \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4
1449 5 6 7 8 9 : ; < = > ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y
1450 Z [ \ ] ^ _ ` c d e f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f
1451 \x80 \x81 \x82 \x83 \x84 \x85 \x86 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e
1452 \x8f \x90 \x91 \x92 \x93 \x94 \x95 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d
1453 \x9e \x9f \xa0 \xa1 \xa2 \xa3 \xa4 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac
1454 \xad \xae \xaf \xb0 \xb1 \xb2 \xb3 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb
1455 \xbc \xbd \xbe \xbf \xc0 \xc1 \xc2 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca
1456 \xcb \xcc \xcd \xce \xcf \xd0 \xd1 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9
1457 \xda \xdb \xdc \xdd \xde \xdf \xe0 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8
1458 \xe9 \xea \xeb \xec \xed \xee \xef \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7
1459 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe \xff
1460 Subject length lower bound = 1
1471 # End of testinput12