/[pcre]/code/trunk/testdata/testoutput15
ViewVC logotype

Diff of /code/trunk/testdata/testoutput15

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

revision 689 by ph10, Fri Sep 9 10:34:57 2011 UTC revision 1174 by chpe, Wed Oct 24 21:29:12 2012 UTC
# Line 1  Line 1 
1  /-- This test is run only when JIT support is not available. It checks that an  /-- This set of tests is for UTF-8 support, and is relevant only to the 8-bit
2  attempt to use it has the expected behaviour. It also tests things that      library. --/
3  are different without JIT. --/  
4    /X(\C{3})/8
5  /abc/S+I      X\x{1234}
6     0: X\x{1234}
7     1: \x{1234}
8    
9    /X(\C{4})/8
10        X\x{1234}YZ
11     0: X\x{1234}Y
12     1: \x{1234}Y
13    
14    /X\C*/8
15        XYZabcdce
16     0: XYZabcdce
17    
18    /X\C*?/8
19        XYZabcde
20     0: X
21    
22    /X\C{3,5}/8
23        Xabcdefg
24     0: Xabcde
25        X\x{1234}
26     0: X\x{1234}
27        X\x{1234}YZ
28     0: X\x{1234}YZ
29        X\x{1234}\x{512}
30     0: X\x{1234}\x{512}
31        X\x{1234}\x{512}YZ
32     0: X\x{1234}\x{512}
33    
34    /X\C{3,5}?/8
35        Xabcdefg
36     0: Xabc
37        X\x{1234}
38     0: X\x{1234}
39        X\x{1234}YZ
40     0: X\x{1234}
41        X\x{1234}\x{512}
42     0: X\x{1234}
43    
44    /a\Cb/8
45        aXb
46     0: aXb
47        a\nb
48     0: a\x{0a}b
49    
50    /a\C\Cb/8
51        a\x{100}b
52     0: a\x{100}b
53    
54    /ab\Cde/8
55        abXde
56     0: abXde
57    
58    /a\C\Cb/8
59        a\x{100}b
60     0: a\x{100}b
61        ** Failers
62    No match
63        a\x{12257}b
64    No match
65    
66    /[]/8
67    Failed: invalid UTF-8 string at offset 1
68    
69    //8
70    Failed: invalid UTF-8 string at offset 0
71    
72    /xxx/8
73    Failed: invalid UTF-8 string at offset 0
74    
75    /xxx/8?DZSS
76    ------------------------------------------------------------------
77            Bra
78            \X{c0}\X{c0}\X{c0}xxx
79            Ket
80            End
81    ------------------------------------------------------------------
82  Capturing subpattern count = 0  Capturing subpattern count = 0
83  No options  Options: utf no_utf_check
84  First char = 'a'  First char = \x{c3}
85  Need char = 'c'  Need char = 'x'
86    
87    /abc/8
88        \xdf
89    Error -10 (bad UTF-8 string) offset=0 reason=1
90        \xef
91    Error -10 (bad UTF-8 string) offset=0 reason=2
92        \xef\x80
93    Error -10 (bad UTF-8 string) offset=0 reason=1
94        \xf7
95    Error -10 (bad UTF-8 string) offset=0 reason=3
96        \xf7\x80
97    Error -10 (bad UTF-8 string) offset=0 reason=2
98        \xf7\x80\x80
99    Error -10 (bad UTF-8 string) offset=0 reason=1
100        \xfb
101    Error -10 (bad UTF-8 string) offset=0 reason=4
102        \xfb\x80
103    Error -10 (bad UTF-8 string) offset=0 reason=3
104        \xfb\x80\x80
105    Error -10 (bad UTF-8 string) offset=0 reason=2
106        \xfb\x80\x80\x80
107    Error -10 (bad UTF-8 string) offset=0 reason=1
108        \xfd
109    Error -10 (bad UTF-8 string) offset=0 reason=5
110        \xfd\x80
111    Error -10 (bad UTF-8 string) offset=0 reason=4
112        \xfd\x80\x80
113    Error -10 (bad UTF-8 string) offset=0 reason=3
114        \xfd\x80\x80\x80
115    Error -10 (bad UTF-8 string) offset=0 reason=2
116        \xfd\x80\x80\x80\x80
117    Error -10 (bad UTF-8 string) offset=0 reason=1
118        \xdf\x7f
119    Error -10 (bad UTF-8 string) offset=0 reason=6
120        \xef\x7f\x80
121    Error -10 (bad UTF-8 string) offset=0 reason=6
122        \xef\x80\x7f
123    Error -10 (bad UTF-8 string) offset=0 reason=7
124        \xf7\x7f\x80\x80
125    Error -10 (bad UTF-8 string) offset=0 reason=6
126        \xf7\x80\x7f\x80
127    Error -10 (bad UTF-8 string) offset=0 reason=7
128        \xf7\x80\x80\x7f
129    Error -10 (bad UTF-8 string) offset=0 reason=8
130        \xfb\x7f\x80\x80\x80
131    Error -10 (bad UTF-8 string) offset=0 reason=6
132        \xfb\x80\x7f\x80\x80
133    Error -10 (bad UTF-8 string) offset=0 reason=7
134        \xfb\x80\x80\x7f\x80
135    Error -10 (bad UTF-8 string) offset=0 reason=8
136        \xfb\x80\x80\x80\x7f
137    Error -10 (bad UTF-8 string) offset=0 reason=9
138        \xfd\x7f\x80\x80\x80\x80
139    Error -10 (bad UTF-8 string) offset=0 reason=6
140        \xfd\x80\x7f\x80\x80\x80
141    Error -10 (bad UTF-8 string) offset=0 reason=7
142        \xfd\x80\x80\x7f\x80\x80
143    Error -10 (bad UTF-8 string) offset=0 reason=8
144        \xfd\x80\x80\x80\x7f\x80
145    Error -10 (bad UTF-8 string) offset=0 reason=9
146        \xfd\x80\x80\x80\x80\x7f
147    Error -10 (bad UTF-8 string) offset=0 reason=10
148        \xed\xa0\x80
149    Error -10 (bad UTF-8 string) offset=0 reason=14
150        \xc0\x8f
151    Error -10 (bad UTF-8 string) offset=0 reason=15
152        \xe0\x80\x8f
153    Error -10 (bad UTF-8 string) offset=0 reason=16
154        \xf0\x80\x80\x8f
155    Error -10 (bad UTF-8 string) offset=0 reason=17
156        \xf8\x80\x80\x80\x8f
157    Error -10 (bad UTF-8 string) offset=0 reason=18
158        \xfc\x80\x80\x80\x80\x8f
159    Error -10 (bad UTF-8 string) offset=0 reason=19
160        \x80
161    Error -10 (bad UTF-8 string) offset=0 reason=20
162        \xfe
163    Error -10 (bad UTF-8 string) offset=0 reason=21
164        \xff
165    Error -10 (bad UTF-8 string) offset=0 reason=21
166        \xef\xb7\x90
167    Error -10 (bad UTF-8 string) offset=0 reason=22
168    
169    /abc/8
170        \xfb\x80\x80\x80\x80
171    Error -10 (bad UTF-8 string) offset=0 reason=11
172        \xfd\x80\x80\x80\x80\x80
173    Error -10 (bad UTF-8 string) offset=0 reason=12
174        \xf7\xbf\xbf\xbf
175    Error -10 (bad UTF-8 string) offset=0 reason=13
176    
177    /anything/8
178        \xc0\x80
179    Error -10 (bad UTF-8 string) offset=0 reason=15
180        \xc1\x8f
181    Error -10 (bad UTF-8 string) offset=0 reason=15
182        \xe0\x9f\x80
183    Error -10 (bad UTF-8 string) offset=0 reason=16
184        \xf0\x8f\x80\x80
185    Error -10 (bad UTF-8 string) offset=0 reason=17
186        \xf8\x87\x80\x80\x80
187    Error -10 (bad UTF-8 string) offset=0 reason=18
188        \xfc\x83\x80\x80\x80\x80
189    Error -10 (bad UTF-8 string) offset=0 reason=19
190        \xfe\x80\x80\x80\x80\x80
191    Error -10 (bad UTF-8 string) offset=0 reason=21
192        \xff\x80\x80\x80\x80\x80
193    Error -10 (bad UTF-8 string) offset=0 reason=21
194        \xc3\x8f
195    No match
196        \xe0\xaf\x80
197    No match
198        \xe1\x80\x80
199    No match
200        \xf0\x9f\x80\x80
201    No match
202        \xf1\x8f\x80\x80
203    No match
204        \xf8\x88\x80\x80\x80
205    Error -10 (bad UTF-8 string) offset=0 reason=11
206        \xf9\x87\x80\x80\x80
207    Error -10 (bad UTF-8 string) offset=0 reason=11
208        \xfc\x84\x80\x80\x80\x80
209    Error -10 (bad UTF-8 string) offset=0 reason=12
210        \xfd\x83\x80\x80\x80\x80
211    Error -10 (bad UTF-8 string) offset=0 reason=12
212        \?\xf8\x88\x80\x80\x80
213    No match
214        \?\xf9\x87\x80\x80\x80
215    No match
216        \?\xfc\x84\x80\x80\x80\x80
217    No match
218        \?\xfd\x83\x80\x80\x80\x80
219    No match
220    
221    /noncharacter/8
222        \x{fffe}
223    Error -10 (bad UTF-8 string) offset=0 reason=22
224        \x{ffff}
225    Error -10 (bad UTF-8 string) offset=0 reason=22
226        \x{1fffe}
227    Error -10 (bad UTF-8 string) offset=0 reason=22
228        \x{1ffff}
229    Error -10 (bad UTF-8 string) offset=0 reason=22
230        \x{2fffe}
231    Error -10 (bad UTF-8 string) offset=0 reason=22
232        \x{2ffff}
233    Error -10 (bad UTF-8 string) offset=0 reason=22
234        \x{3fffe}
235    Error -10 (bad UTF-8 string) offset=0 reason=22
236        \x{3ffff}
237    Error -10 (bad UTF-8 string) offset=0 reason=22
238        \x{4fffe}
239    Error -10 (bad UTF-8 string) offset=0 reason=22
240        \x{4ffff}
241    Error -10 (bad UTF-8 string) offset=0 reason=22
242        \x{5fffe}
243    Error -10 (bad UTF-8 string) offset=0 reason=22
244        \x{5ffff}
245    Error -10 (bad UTF-8 string) offset=0 reason=22
246        \x{6fffe}
247    Error -10 (bad UTF-8 string) offset=0 reason=22
248        \x{6ffff}
249    Error -10 (bad UTF-8 string) offset=0 reason=22
250        \x{7fffe}
251    Error -10 (bad UTF-8 string) offset=0 reason=22
252        \x{7ffff}
253    Error -10 (bad UTF-8 string) offset=0 reason=22
254        \x{8fffe}
255    Error -10 (bad UTF-8 string) offset=0 reason=22
256        \x{8ffff}
257    Error -10 (bad UTF-8 string) offset=0 reason=22
258        \x{9fffe}
259    Error -10 (bad UTF-8 string) offset=0 reason=22
260        \x{9ffff}
261    Error -10 (bad UTF-8 string) offset=0 reason=22
262        \x{afffe}
263    Error -10 (bad UTF-8 string) offset=0 reason=22
264        \x{affff}
265    Error -10 (bad UTF-8 string) offset=0 reason=22
266        \x{bfffe}
267    Error -10 (bad UTF-8 string) offset=0 reason=22
268        \x{bffff}
269    Error -10 (bad UTF-8 string) offset=0 reason=22
270        \x{cfffe}
271    Error -10 (bad UTF-8 string) offset=0 reason=22
272        \x{cffff}
273    Error -10 (bad UTF-8 string) offset=0 reason=22
274        \x{dfffe}
275    Error -10 (bad UTF-8 string) offset=0 reason=22
276        \x{dffff}
277    Error -10 (bad UTF-8 string) offset=0 reason=22
278        \x{efffe}
279    Error -10 (bad UTF-8 string) offset=0 reason=22
280        \x{effff}
281    Error -10 (bad UTF-8 string) offset=0 reason=22
282        \x{ffffe}
283    Error -10 (bad UTF-8 string) offset=0 reason=22
284        \x{fffff}
285    Error -10 (bad UTF-8 string) offset=0 reason=22
286        \x{10fffe}
287    Error -10 (bad UTF-8 string) offset=0 reason=22
288        \x{10ffff}
289    Error -10 (bad UTF-8 string) offset=0 reason=22
290        \x{fdd0}
291    Error -10 (bad UTF-8 string) offset=0 reason=22
292        \x{fdd1}
293    Error -10 (bad UTF-8 string) offset=0 reason=22
294        \x{fdd2}
295    Error -10 (bad UTF-8 string) offset=0 reason=22
296        \x{fdd3}
297    Error -10 (bad UTF-8 string) offset=0 reason=22
298        \x{fdd4}
299    Error -10 (bad UTF-8 string) offset=0 reason=22
300        \x{fdd5}
301    Error -10 (bad UTF-8 string) offset=0 reason=22
302        \x{fdd6}
303    Error -10 (bad UTF-8 string) offset=0 reason=22
304        \x{fdd7}
305    Error -10 (bad UTF-8 string) offset=0 reason=22
306        \x{fdd8}
307    Error -10 (bad UTF-8 string) offset=0 reason=22
308        \x{fdd9}
309    Error -10 (bad UTF-8 string) offset=0 reason=22
310        \x{fdda}
311    Error -10 (bad UTF-8 string) offset=0 reason=22
312        \x{fddb}
313    Error -10 (bad UTF-8 string) offset=0 reason=22
314        \x{fddc}
315    Error -10 (bad UTF-8 string) offset=0 reason=22
316        \x{fddd}
317    Error -10 (bad UTF-8 string) offset=0 reason=22
318        \x{fdde}
319    Error -10 (bad UTF-8 string) offset=0 reason=22
320        \x{fddf}
321    Error -10 (bad UTF-8 string) offset=0 reason=22
322        \x{fde0}
323    Error -10 (bad UTF-8 string) offset=0 reason=22
324        \x{fde1}
325    Error -10 (bad UTF-8 string) offset=0 reason=22
326        \x{fde2}
327    Error -10 (bad UTF-8 string) offset=0 reason=22
328        \x{fde3}
329    Error -10 (bad UTF-8 string) offset=0 reason=22
330        \x{fde4}
331    Error -10 (bad UTF-8 string) offset=0 reason=22
332        \x{fde5}
333    Error -10 (bad UTF-8 string) offset=0 reason=22
334        \x{fde6}
335    Error -10 (bad UTF-8 string) offset=0 reason=22
336        \x{fde7}
337    Error -10 (bad UTF-8 string) offset=0 reason=22
338        \x{fde8}
339    Error -10 (bad UTF-8 string) offset=0 reason=22
340        \x{fde9}
341    Error -10 (bad UTF-8 string) offset=0 reason=22
342        \x{fdea}
343    Error -10 (bad UTF-8 string) offset=0 reason=22
344        \x{fdeb}
345    Error -10 (bad UTF-8 string) offset=0 reason=22
346        \x{fdec}
347    Error -10 (bad UTF-8 string) offset=0 reason=22
348        \x{fded}
349    Error -10 (bad UTF-8 string) offset=0 reason=22
350        \x{fdee}
351    Error -10 (bad UTF-8 string) offset=0 reason=22
352        \x{fdef}
353    Error -10 (bad UTF-8 string) offset=0 reason=22
354    
355    /\x{100}/8DZ
356    ------------------------------------------------------------------
357            Bra
358            \x{100}
359            Ket
360            End
361    ------------------------------------------------------------------
362    Capturing subpattern count = 0
363    Options: utf
364    First char = \x{c4}
365    Need char = \x{80}
366    
367    /\x{1000}/8DZ
368    ------------------------------------------------------------------
369            Bra
370            \x{1000}
371            Ket
372            End
373    ------------------------------------------------------------------
374    Capturing subpattern count = 0
375    Options: utf
376    First char = \x{e1}
377    Need char = \x{80}
378    
379    /\x{10000}/8DZ
380    ------------------------------------------------------------------
381            Bra
382            \x{10000}
383            Ket
384            End
385    ------------------------------------------------------------------
386    Capturing subpattern count = 0
387    Options: utf
388    First char = \x{f0}
389    Need char = \x{80}
390    
391    /\x{100000}/8DZ
392    ------------------------------------------------------------------
393            Bra
394            \x{100000}
395            Ket
396            End
397    ------------------------------------------------------------------
398    Capturing subpattern count = 0
399    Options: utf
400    First char = \x{f4}
401    Need char = \x{80}
402    
403    /\x{10ffff}/8DZ
404    ------------------------------------------------------------------
405            Bra
406            \x{10ffff}
407            Ket
408            End
409    ------------------------------------------------------------------
410    Capturing subpattern count = 0
411    Options: utf
412    First char = \x{f4}
413    Need char = \x{bf}
414    
415    /[\x{ff}]/8DZ
416    ------------------------------------------------------------------
417            Bra
418            \x{ff}
419            Ket
420            End
421    ------------------------------------------------------------------
422    Capturing subpattern count = 0
423    Options: utf
424    First char = \x{c3}
425    Need char = \x{bf}
426    
427    /[\x{100}]/8DZ
428    ------------------------------------------------------------------
429            Bra
430            \x{100}
431            Ket
432            End
433    ------------------------------------------------------------------
434    Capturing subpattern count = 0
435    Options: utf
436    First char = \x{c4}
437    Need char = \x{80}
438    
439    /\x80/8DZ
440    ------------------------------------------------------------------
441            Bra
442            \x{80}
443            Ket
444            End
445    ------------------------------------------------------------------
446    Capturing subpattern count = 0
447    Options: utf
448    First char = \x{c2}
449    Need char = \x{80}
450    
451    /\xff/8DZ
452    ------------------------------------------------------------------
453            Bra
454            \x{ff}
455            Ket
456            End
457    ------------------------------------------------------------------
458    Capturing subpattern count = 0
459    Options: utf
460    First char = \x{c3}
461    Need char = \x{bf}
462    
463    /\x{D55c}\x{ad6d}\x{C5B4}/DZ8
464    ------------------------------------------------------------------
465            Bra
466            \x{d55c}\x{ad6d}\x{c5b4}
467            Ket
468            End
469    ------------------------------------------------------------------
470    Capturing subpattern count = 0
471    Options: utf
472    First char = \x{ed}
473    Need char = \x{b4}
474        \x{D55c}\x{ad6d}\x{C5B4}
475     0: \x{d55c}\x{ad6d}\x{c5b4}
476    
477    /\x{65e5}\x{672c}\x{8a9e}/DZ8
478    ------------------------------------------------------------------
479            Bra
480            \x{65e5}\x{672c}\x{8a9e}
481            Ket
482            End
483    ------------------------------------------------------------------
484    Capturing subpattern count = 0
485    Options: utf
486    First char = \x{e6}
487    Need char = \x{9e}
488        \x{65e5}\x{672c}\x{8a9e}
489     0: \x{65e5}\x{672c}\x{8a9e}
490    
491    /\x{80}/DZ8
492    ------------------------------------------------------------------
493            Bra
494            \x{80}
495            Ket
496            End
497    ------------------------------------------------------------------
498    Capturing subpattern count = 0
499    Options: utf
500    First char = \x{c2}
501    Need char = \x{80}
502    
503    /\x{084}/DZ8
504    ------------------------------------------------------------------
505            Bra
506            \x{84}
507            Ket
508            End
509    ------------------------------------------------------------------
510    Capturing subpattern count = 0
511    Options: utf
512    First char = \x{c2}
513    Need char = \x{84}
514    
515    /\x{104}/DZ8
516    ------------------------------------------------------------------
517            Bra
518            \x{104}
519            Ket
520            End
521    ------------------------------------------------------------------
522    Capturing subpattern count = 0
523    Options: utf
524    First char = \x{c4}
525    Need char = \x{84}
526    
527    /\x{861}/DZ8
528    ------------------------------------------------------------------
529            Bra
530            \x{861}
531            Ket
532            End
533    ------------------------------------------------------------------
534    Capturing subpattern count = 0
535    Options: utf
536    First char = \x{e0}
537    Need char = \x{a1}
538    
539    /\x{212ab}/DZ8
540    ------------------------------------------------------------------
541            Bra
542            \x{212ab}
543            Ket
544            End
545    ------------------------------------------------------------------
546    Capturing subpattern count = 0
547    Options: utf
548    First char = \x{f0}
549    Need char = \x{ab}
550    
551    /-- This one is here not because it's different to Perl, but because the way
552    the captured single-byte is displayed. (In Perl it becomes a character, and you
553    can't tell the difference.) --/
554    
555    /X(\C)(.*)/8
556        X\x{1234}
557     0: X\x{1234}
558     1: \x{e1}
559     2: \x{88}\x{b4}
560        X\nabc
561     0: X\x{0a}abc
562     1: \x{0a}
563     2: abc
564    
565    /-- This one is here because Perl gives out a grumbly error message (quite
566    correctly, but that messes up comparisons). --/
567    
568    /a\Cb/8
569        *** Failers
570    No match
571        a\x{100}b
572    No match
573    
574    /[^ab\xC0-\xF0]/8SDZ
575    ------------------------------------------------------------------
576            Bra
577            [\x00-`c-\xbf\xf1-\xff] (neg)
578            Ket
579            End
580    ------------------------------------------------------------------
581    Capturing subpattern count = 0
582    Options: utf
583    No first char
584    No need char
585    Subject length lower bound = 1
586    Starting byte set: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a
587      \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19
588      \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4
589      5 6 7 8 9 : ; < = > ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y
590      Z [ \ ] ^ _ ` c d e f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f
591      \xc2 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0
592      \xd1 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf
593      \xe0 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee
594      \xef \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd
595      \xfe \xff
596        \x{f1}
597     0: \x{f1}
598        \x{bf}
599     0: \x{bf}
600        \x{100}
601     0: \x{100}
602        \x{1000}
603     0: \x{1000}
604        *** Failers
605     0: *
606        \x{c0}
607    No match
608        \x{f0}
609    No match
610    
611    /Ā{3,4}/8SDZ
612    ------------------------------------------------------------------
613            Bra
614            \x{100}{3}
615            \x{100}?
616            Ket
617            End
618    ------------------------------------------------------------------
619    Capturing subpattern count = 0
620    Options: utf
621    First char = \x{c4}
622    Need char = \x{80}
623  Subject length lower bound = 3  Subject length lower bound = 3
624  No set of starting bytes  No set of starting bytes
625  JIT support is not available in this version of PCRE    \x{100}\x{100}\x{100}\x{100\x{100}
626     0: \x{100}\x{100}\x{100}
627    
628  /\p{Xps}*/SI  /(\x{100}+|x)/8SDZ
629    ------------------------------------------------------------------
630            Bra
631            CBra 1
632            \x{100}+
633            Alt
634            x
635            Ket
636            Ket
637            End
638    ------------------------------------------------------------------
639    Capturing subpattern count = 1
640    Options: utf
641    No first char
642    No need char
643    Subject length lower bound = 1
644    Starting byte set: x \xc4
645    
646    /(\x{100}*a|x)/8SDZ
647    ------------------------------------------------------------------
648            Bra
649            CBra 1
650            \x{100}*+
651            a
652            Alt
653            x
654            Ket
655            Ket
656            End
657    ------------------------------------------------------------------
658    Capturing subpattern count = 1
659    Options: utf
660    No first char
661    No need char
662    Subject length lower bound = 1
663    Starting byte set: a x \xc4
664    
665    /(\x{100}{0,2}a|x)/8SDZ
666    ------------------------------------------------------------------
667            Bra
668            CBra 1
669            \x{100}{0,2}
670            a
671            Alt
672            x
673            Ket
674            Ket
675            End
676    ------------------------------------------------------------------
677    Capturing subpattern count = 1
678    Options: utf
679    No first char
680    No need char
681    Subject length lower bound = 1
682    Starting byte set: a x \xc4
683    
684    /(\x{100}{1,2}a|x)/8SDZ
685    ------------------------------------------------------------------
686            Bra
687            CBra 1
688            \x{100}
689            \x{100}{0,1}
690            a
691            Alt
692            x
693            Ket
694            Ket
695            End
696    ------------------------------------------------------------------
697    Capturing subpattern count = 1
698    Options: utf
699    No first char
700    No need char
701    Subject length lower bound = 1
702    Starting byte set: x \xc4
703    
704    /\x{100}/8DZ
705    ------------------------------------------------------------------
706            Bra
707            \x{100}
708            Ket
709            End
710    ------------------------------------------------------------------
711    Capturing subpattern count = 0
712    Options: utf
713    First char = \x{c4}
714    Need char = \x{80}
715    
716    /a\x{100}\x{101}*/8DZ
717    ------------------------------------------------------------------
718            Bra
719            a\x{100}
720            \x{101}*
721            Ket
722            End
723    ------------------------------------------------------------------
724    Capturing subpattern count = 0
725    Options: utf
726    First char = 'a'
727    Need char = \x{80}
728    
729    /a\x{100}\x{101}+/8DZ
730    ------------------------------------------------------------------
731            Bra
732            a\x{100}
733            \x{101}+
734            Ket
735            End
736    ------------------------------------------------------------------
737    Capturing subpattern count = 0
738    Options: utf
739    First char = 'a'
740    Need char = \x{81}
741    
742    /[^\x{c4}]/DZ
743    ------------------------------------------------------------------
744            Bra
745            [^\x{c4}]
746            Ket
747            End
748    ------------------------------------------------------------------
749  Capturing subpattern count = 0  Capturing subpattern count = 0
750  No options  No options
751  No first char  No first char
752  No need char  No need char
753  Study returned NULL  
754  JIT support is not available in this version of PCRE  /[\x{100}]/8DZ
755    ------------------------------------------------------------------
756            Bra
757            \x{100}
758            Ket
759            End
760    ------------------------------------------------------------------
761    Capturing subpattern count = 0
762    Options: utf
763    First char = \x{c4}
764    Need char = \x{80}
765        \x{100}
766     0: \x{100}
767        Z\x{100}
768     0: \x{100}
769        \x{100}Z
770     0: \x{100}
771        *** Failers
772    No match
773    
774    /[\xff]/DZ8
775    ------------------------------------------------------------------
776            Bra
777            \x{ff}
778            Ket
779            End
780    ------------------------------------------------------------------
781    Capturing subpattern count = 0
782    Options: utf
783    First char = \x{c3}
784    Need char = \x{bf}
785        >\x{ff}<
786     0: \x{ff}
787    
788    /[^\xff]/8DZ
789    ------------------------------------------------------------------
790            Bra
791            [^\x{ff}]
792            Ket
793            End
794    ------------------------------------------------------------------
795    Capturing subpattern count = 0
796    Options: utf
797    No first char
798    No need char
799    
800    /\x{100}abc(xyz(?1))/8DZ
801    ------------------------------------------------------------------
802            Bra
803            \x{100}abc
804            CBra 1
805            xyz
806            Recurse
807            Ket
808            Ket
809            End
810    ------------------------------------------------------------------
811    Capturing subpattern count = 1
812    Options: utf
813    First char = \x{c4}
814    Need char = 'z'
815    
816    /a\x{1234}b/P8
817        a\x{1234}b
818     0: a\x{1234}b
819    
820    /\777/8I
821    Capturing subpattern count = 0
822    Options: utf
823    First char = \x{c7}
824    Need char = \x{bf}
825      \x{1ff}
826     0: \x{1ff}
827      \777
828     0: \x{1ff}
829    
830    /\x{100}+\x{200}/8DZ
831    ------------------------------------------------------------------
832            Bra
833            \x{100}++
834            \x{200}
835            Ket
836            End
837    ------------------------------------------------------------------
838    Capturing subpattern count = 0
839    Options: utf
840    First char = \x{c4}
841    Need char = \x{80}
842    
843    /\x{100}+X/8DZ
844    ------------------------------------------------------------------
845            Bra
846            \x{100}++
847            X
848            Ket
849            End
850    ------------------------------------------------------------------
851    Capturing subpattern count = 0
852    Options: utf
853    First char = \x{c4}
854    Need char = 'X'
855    
856    /^[\QĀ\E-\QŐ\E/BZ8
857    Failed: missing terminating ] for character class at offset 15
858    
859    /-- This tests the stricter UTF-8 check according to RFC 3629. --/
860    
861    /X/8
862        \x{0}\x{d7ff}\x{e000}\x{10ffff}
863    Error -10 (bad UTF-8 string) offset=7 reason=22
864        \x{d800}
865    Error -10 (bad UTF-8 string) offset=0 reason=14
866        \x{d800}\?
867    No match
868        \x{da00}
869    Error -10 (bad UTF-8 string) offset=0 reason=14
870        \x{da00}\?
871    No match
872        \x{dfff}
873    Error -10 (bad UTF-8 string) offset=0 reason=14
874        \x{dfff}\?
875    No match
876        \x{110000}
877    Error -10 (bad UTF-8 string) offset=0 reason=13
878        \x{110000}\?
879    No match
880        \x{2000000}
881    Error -10 (bad UTF-8 string) offset=0 reason=11
882        \x{2000000}\?
883    No match
884        \x{7fffffff}
885    Error -10 (bad UTF-8 string) offset=0 reason=12
886        \x{7fffffff}\?
887    No match
888    
889    /(*UTF8)\x{1234}/
890      abcd\x{1234}pqr
891     0: \x{1234}
892    
893    /(*CRLF)(*UTF8)(*BSR_UNICODE)a\Rb/I
894    Capturing subpattern count = 0
895    Options: bsr_unicode utf
896    Forced newline sequence: CRLF
897    First char = 'a'
898    Need char = 'b'
899    
900    /\h/SI8
901    Capturing subpattern count = 0
902    Options: utf
903    No first char
904    No need char
905    Subject length lower bound = 1
906    Starting byte set: \x09 \x20 \xc2 \xe1 \xe2 \xe3
907        ABC\x{09}
908     0: \x{09}
909        ABC\x{20}
910     0:
911        ABC\x{a0}
912     0: \x{a0}
913        ABC\x{1680}
914     0: \x{1680}
915        ABC\x{180e}
916     0: \x{180e}
917        ABC\x{2000}
918     0: \x{2000}
919        ABC\x{202f}
920     0: \x{202f}
921        ABC\x{205f}
922     0: \x{205f}
923        ABC\x{3000}
924     0: \x{3000}
925    
926    /\v/SI8
927    Capturing subpattern count = 0
928    Options: utf
929    No first char
930    No need char
931    Subject length lower bound = 1
932    Starting byte set: \x0a \x0b \x0c \x0d \xc2 \xe2
933        ABC\x{0a}
934     0: \x{0a}
935        ABC\x{0b}
936     0: \x{0b}
937        ABC\x{0c}
938     0: \x{0c}
939        ABC\x{0d}
940     0: \x{0d}
941        ABC\x{85}
942     0: \x{85}
943        ABC\x{2028}
944     0: \x{2028}
945    
946    /\h*A/SI8
947    Capturing subpattern count = 0
948    Options: utf
949    No first char
950    Need char = 'A'
951    Subject length lower bound = 1
952    Starting byte set: \x09 \x20 A \xc2 \xe1 \xe2 \xe3
953        CDBABC
954     0: A
955    
956    /\v+A/SI8
957    Capturing subpattern count = 0
958    Options: utf
959    No first char
960    Need char = 'A'
961    Subject length lower bound = 2
962    Starting byte set: \x0a \x0b \x0c \x0d \xc2 \xe2
963    
964    /\s?xxx\s/8SI
965    Capturing subpattern count = 0
966    Options: utf
967    No first char
968    Need char = 'x'
969    Subject length lower bound = 4
970    Starting byte set: \x09 \x0a \x0c \x0d \x20 x
971    
972    /\sxxx\s/I8ST1
973    Capturing subpattern count = 0
974    Options: utf
975    No first char
976    Need char = 'x'
977    Subject length lower bound = 5
978    Starting byte set: \x09 \x0a \x0c \x0d \x20 \xc2
979        AB\x{85}xxx\x{a0}XYZ
980     0: \x{85}xxx\x{a0}
981        AB\x{a0}xxx\x{85}XYZ
982     0: \x{a0}xxx\x{85}
983    
984    /\S \S/I8ST1
985    Capturing subpattern count = 0
986    Options: utf
987    No first char
988    Need char = ' '
989    Subject length lower bound = 3
990    Starting byte set: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x0b \x0e
991      \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 \x1a \x1b \x1c \x1d
992      \x1e \x1f ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 5 6 7 8 9 : ; < = > ? @
993      A B C D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c d e
994      f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f \xc0 \xc1 \xc2 \xc3
995      \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1 \xd2
996      \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0 \xe1
997      \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee \xef \xf0
998      \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe \xff
999        \x{a2} \x{84}
1000     0: \x{a2} \x{84}
1001        A Z
1002     0: A Z
1003    
1004    /a+/8
1005        a\x{123}aa\>1
1006     0: aa
1007        a\x{123}aa\>2
1008    Error -11 (bad UTF-8 offset)
1009        a\x{123}aa\>3
1010     0: aa
1011        a\x{123}aa\>4
1012     0: a
1013        a\x{123}aa\>5
1014    No match
1015        a\x{123}aa\>6
1016    Error -24 (bad offset value)
1017    
1018    /\x{1234}+/iS8I
1019    Capturing subpattern count = 0
1020    Options: caseless utf
1021    No first char
1022    No need char
1023    Subject length lower bound = 1
1024    Starting byte set: \xe1
1025    
1026    /\x{1234}+?/iS8I
1027    Capturing subpattern count = 0
1028    Options: caseless utf
1029    No first char
1030    No need char
1031    Subject length lower bound = 1
1032    Starting byte set: \xe1
1033    
1034    /\x{1234}++/iS8I
1035    Capturing subpattern count = 0
1036    Options: caseless utf
1037    No first char
1038    No need char
1039    Subject length lower bound = 1
1040    Starting byte set: \xe1
1041    
1042    /\x{1234}{2}/iS8I
1043    Capturing subpattern count = 0
1044    Options: caseless utf
1045    No first char
1046    No need char
1047    Subject length lower bound = 2
1048    Starting byte set: \xe1
1049    
1050    /[^\x{c4}]/8DZ
1051    ------------------------------------------------------------------
1052            Bra
1053            [^\x{c4}]
1054            Ket
1055            End
1056    ------------------------------------------------------------------
1057    Capturing subpattern count = 0
1058    Options: utf
1059    No first char
1060    No need char
1061    
1062    /X+\x{200}/8DZ
1063    ------------------------------------------------------------------
1064            Bra
1065            X++
1066            \x{200}
1067            Ket
1068            End
1069    ------------------------------------------------------------------
1070    Capturing subpattern count = 0
1071    Options: utf
1072    First char = 'X'
1073    Need char = \x{80}
1074    
1075    /\R/SI8
1076    Capturing subpattern count = 0
1077    Options: utf
1078    No first char
1079    No need char
1080    Subject length lower bound = 1
1081    Starting byte set: \x0a \x0b \x0c \x0d \xc2 \xe2
1082    
1083    /\777/8DZ
1084    ------------------------------------------------------------------
1085            Bra
1086            \x{1ff}
1087            Ket
1088            End
1089    ------------------------------------------------------------------
1090    Capturing subpattern count = 0
1091    Options: utf
1092    First char = \x{c7}
1093    Need char = \x{bf}
1094    
1095    /\w+\x{C4}/8BZ
1096    ------------------------------------------------------------------
1097            Bra
1098            \w++
1099            \x{c4}
1100            Ket
1101            End
1102    ------------------------------------------------------------------
1103        a\x{C4}\x{C4}
1104     0: a\x{c4}
1105    
1106    /\w+\x{C4}/8BZT1
1107    ------------------------------------------------------------------
1108            Bra
1109            \w+
1110            \x{c4}
1111            Ket
1112            End
1113    ------------------------------------------------------------------
1114        a\x{C4}\x{C4}
1115     0: a\x{c4}\x{c4}
1116    
1117    /\W+\x{C4}/8BZ
1118    ------------------------------------------------------------------
1119            Bra
1120            \W+
1121            \x{c4}
1122            Ket
1123            End
1124    ------------------------------------------------------------------
1125        !\x{C4}
1126     0: !\x{c4}
1127    
1128    /\W+\x{C4}/8BZT1
1129    ------------------------------------------------------------------
1130            Bra
1131            \W++
1132            \x{c4}
1133            Ket
1134            End
1135    ------------------------------------------------------------------
1136        !\x{C4}
1137     0: !\x{c4}
1138    
1139    /\W+\x{A1}/8BZ
1140    ------------------------------------------------------------------
1141            Bra
1142            \W+
1143            \x{a1}
1144            Ket
1145            End
1146    ------------------------------------------------------------------
1147        !\x{A1}
1148     0: !\x{a1}
1149    
1150    /\W+\x{A1}/8BZT1
1151    ------------------------------------------------------------------
1152            Bra
1153            \W+
1154            \x{a1}
1155            Ket
1156            End
1157    ------------------------------------------------------------------
1158        !\x{A1}
1159     0: !\x{a1}
1160    
1161    /X\s+\x{A0}/8BZ
1162    ------------------------------------------------------------------
1163            Bra
1164            X
1165            \s++
1166            \x{a0}
1167            Ket
1168            End
1169    ------------------------------------------------------------------
1170        X\x20\x{A0}\x{A0}
1171     0: X \x{a0}
1172    
1173    /X\s+\x{A0}/8BZT1
1174    ------------------------------------------------------------------
1175            Bra
1176            X
1177            \s+
1178            \x{a0}
1179            Ket
1180            End
1181    ------------------------------------------------------------------
1182        X\x20\x{A0}\x{A0}
1183     0: X \x{a0}\x{a0}
1184    
1185    /\S+\x{A0}/8BZ
1186    ------------------------------------------------------------------
1187            Bra
1188            \S+
1189            \x{a0}
1190            Ket
1191            End
1192    ------------------------------------------------------------------
1193        X\x{A0}\x{A0}
1194     0: X\x{a0}\x{a0}
1195    
1196    /\S+\x{A0}/8BZT1
1197    ------------------------------------------------------------------
1198            Bra
1199            \S++
1200            \x{a0}
1201            Ket
1202            End
1203    ------------------------------------------------------------------
1204        X\x{A0}\x{A0}
1205     0: X\x{a0}
1206    
1207    /\x{a0}+\s!/8BZ
1208    ------------------------------------------------------------------
1209            Bra
1210            \x{a0}++
1211            \s
1212            !
1213            Ket
1214            End
1215    ------------------------------------------------------------------
1216        \x{a0}\x20!
1217     0: \x{a0} !
1218    
1219    /\x{a0}+\s!/8BZT1
1220    ------------------------------------------------------------------
1221            Bra
1222            \x{a0}+
1223            \s
1224            !
1225            Ket
1226            End
1227    ------------------------------------------------------------------
1228        \x{a0}\x20!
1229     0: \x{a0} !
1230    
1231  /-- End of testinput15 --/  /-- End of testinput15 --/

Legend:
Removed from v.689  
changed lines
  Added in v.1174

  ViewVC Help
Powered by ViewVC 1.1.5