/[pcre]/code/trunk/testdata/testoutput17
ViewVC logotype

Diff of /code/trunk/testdata/testoutput17

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

code/branches/pcre16/testdata/testoutput17 revision 810 by ph10, Mon Dec 19 13:34:10 2011 UTC code/trunk/testdata/testoutput17 revision 1382 by zherczeg, Fri Oct 18 07:55:07 2013 UTC
# Line 1  Line 1 
1  /-- This set of tests is for UTF-8 support, and is relevant only to the 8-bit  /-- This set of tests is for the 16- and 32-bit library's basic (non-UTF-16
2      library. --/      or -32) features that are not compatible with the 8-bit library, or which
3        give different output in 16- or 32-bit mode. --/
 /X(\C{3})/8  
     X\x{1234}  
  0: X\x{1234}  
  1: \x{1234}  
   
 /X(\C{4})/8  
     X\x{1234}YZ  
  0: X\x{1234}Y  
  1: \x{1234}Y  
   
 /X\C*/8  
     XYZabcdce  
  0: XYZabcdce  
   
 /X\C*?/8  
     XYZabcde  
  0: X  
   
 /X\C{3,5}/8  
     Xabcdefg  
  0: Xabcde  
     X\x{1234}  
  0: X\x{1234}  
     X\x{1234}YZ  
  0: X\x{1234}YZ  
     X\x{1234}\x{512}  
  0: X\x{1234}\x{512}  
     X\x{1234}\x{512}YZ  
  0: X\x{1234}\x{512}  
   
 /X\C{3,5}?/8  
     Xabcdefg  
  0: Xabc  
     X\x{1234}  
  0: X\x{1234}  
     X\x{1234}YZ  
  0: X\x{1234}  
     X\x{1234}\x{512}  
  0: X\x{1234}  
4    
5  /a\Cb/  /a\Cb/
6      aXb      aXb
# Line 47  Line 8 
8      a\nb      a\nb
9   0: a\x0ab   0: a\x0ab
10    
11  /a\Cb/8  /[^\x{c4}]/DZ
     aXb  
  0: aXb  
     a\nb  
  0: a\x{0a}b  
   
 /a\C\Cb/8  
     a\x{100}b  
  0: a\x{100}b  
   
 /ab\Cde/8  
     abXde  
  0: abXde  
   
 /a\C\Cb/8  
     a\x{100}b  
  0: a\x{100}b  
     ** Failers  
 No match  
     a\x{12257}b  
 No match  
   
 /[]/8  
 Failed: invalid UTF-8 string at offset 1  
   
 //8  
 Failed: invalid UTF-8 string at offset 0  
   
 /xxx/8  
 Failed: invalid UTF-8 string at offset 0  
   
 /xxx/8?DZSS  
 ------------------------------------------------------------------  
         Bra  
         \X{c0}\X{c0}\X{c0}xxx  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 0  
 Options: utf no_utf_check  
 First char = \x{c3}  
 Need char = 'x'  
   
 /abc/8  
     ]  
 Error -10 (bad UTF-8 string) offset=0 reason=6  
       
 Error -10 (bad UTF-8 string) offset=0 reason=1  
       
 Error -10 (bad UTF-8 string) offset=0 reason=6  
     \?  
 No match  
     \xe1\x88  
 Error -10 (bad UTF-8 string) offset=0 reason=1  
     \P\xe1\x88  
 Error -10 (bad UTF-8 string) offset=0 reason=1  
     \P\P\xe1\x88  
 Error -25 (short UTF-8 string) offset=0 reason=1  
     XX\xea  
 Error -10 (bad UTF-8 string) offset=2 reason=2  
     \O0XX\xea  
 Error -10 (bad UTF-8 string)  
     \O1XX\xea  
 Error -10 (bad UTF-8 string)  
     \O2XX\xea  
 Error -10 (bad UTF-8 string) offset=2 reason=2  
     XX\xf1  
 Error -10 (bad UTF-8 string) offset=2 reason=3  
     XX\xf8  
 Error -10 (bad UTF-8 string) offset=2 reason=4  
     XX\xfc  
 Error -10 (bad UTF-8 string) offset=2 reason=5  
     ZZ\xea\xaf\x20YY  
 Error -10 (bad UTF-8 string) offset=2 reason=7  
     ZZ\xfd\xbf\xbf\x2f\xbf\xbfYY  
 Error -10 (bad UTF-8 string) offset=2 reason=8  
     ZZ\xfd\xbf\xbf\xbf\x2f\xbfYY  
 Error -10 (bad UTF-8 string) offset=2 reason=9  
     ZZ\xfd\xbf\xbf\xbf\xbf\x2fYY  
 Error -10 (bad UTF-8 string) offset=2 reason=10  
     ZZ\xffYY  
 Error -10 (bad UTF-8 string) offset=2 reason=21  
     ZZ\xfeYY  
 Error -10 (bad UTF-8 string) offset=2 reason=21  
   
 /anything/8  
     \xc0\x80  
 Error -10 (bad UTF-8 string) offset=0 reason=15  
     \xc1\x8f  
 Error -10 (bad UTF-8 string) offset=0 reason=15  
     \xe0\x9f\x80  
 Error -10 (bad UTF-8 string) offset=0 reason=16  
     \xf0\x8f\x80\x80  
 Error -10 (bad UTF-8 string) offset=0 reason=17  
     \xf8\x87\x80\x80\x80  
 Error -10 (bad UTF-8 string) offset=0 reason=18  
     \xfc\x83\x80\x80\x80\x80  
 Error -10 (bad UTF-8 string) offset=0 reason=19  
     \xfe\x80\x80\x80\x80\x80  
 Error -10 (bad UTF-8 string) offset=0 reason=21  
     \xff\x80\x80\x80\x80\x80  
 Error -10 (bad UTF-8 string) offset=0 reason=21  
     \xc3\x8f  
 No match  
     \xe0\xaf\x80  
 No match  
     \xe1\x80\x80  
 No match  
     \xf0\x9f\x80\x80  
 No match  
     \xf1\x8f\x80\x80  
 No match  
     \xf8\x88\x80\x80\x80  
 Error -10 (bad UTF-8 string) offset=0 reason=11  
     \xf9\x87\x80\x80\x80  
 Error -10 (bad UTF-8 string) offset=0 reason=11  
     \xfc\x84\x80\x80\x80\x80  
 Error -10 (bad UTF-8 string) offset=0 reason=12  
     \xfd\x83\x80\x80\x80\x80  
 Error -10 (bad UTF-8 string) offset=0 reason=12  
     \?\xf8\x88\x80\x80\x80  
 No match  
     \?\xf9\x87\x80\x80\x80  
 No match  
     \?\xfc\x84\x80\x80\x80\x80  
 No match  
     \?\xfd\x83\x80\x80\x80\x80  
 No match  
   
 /\x{100}/8DZ  
 ------------------------------------------------------------------  
         Bra  
         \x{100}  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{c4}  
 Need char = 128  
   
 /\x{1000}/8DZ  
 ------------------------------------------------------------------  
         Bra  
         \x{1000}  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{e1}  
 Need char = 128  
   
 /\x{10000}/8DZ  
 ------------------------------------------------------------------  
         Bra  
         \x{10000}  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{f0}  
 Need char = 128  
   
 /\x{100000}/8DZ  
 ------------------------------------------------------------------  
         Bra  
         \x{100000}  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{f4}  
 Need char = 128  
   
 /\x{10ffff}/8DZ  
 ------------------------------------------------------------------  
         Bra  
         \x{10ffff}  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{f4}  
 Need char = 191  
   
 /[\x{ff}]/8DZ  
 ------------------------------------------------------------------  
         Bra  
         \x{ff}  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{c3}  
 Need char = 191  
   
 /[\x{100}]/8DZ  
 ------------------------------------------------------------------  
         Bra  
         \x{100}  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{c4}  
 Need char = 128  
   
 /\x80/8DZ  
12  ------------------------------------------------------------------  ------------------------------------------------------------------
13          Bra          Bra
14          \x{80}          [^\x{c4}]
15          Ket          Ket
16          End          End
17  ------------------------------------------------------------------  ------------------------------------------------------------------
18  Capturing subpattern count = 0  Capturing subpattern count = 0
19  Options: utf  No options
20  First char = \x{c2}  No first char
21  Need char = 128  No need char
22    
23  /\xff/8DZ  /\x{100}/I
 ------------------------------------------------------------------  
         Bra  
         \x{ff}  
         Ket  
         End  
 ------------------------------------------------------------------  
24  Capturing subpattern count = 0  Capturing subpattern count = 0
25  Options: utf  No options
26  First char = \x{c3}  First char = \x{100}
27  Need char = 191  No need char
28    
29  /\x{D55c}\x{ad6d}\x{C5B4}/DZ8  /  (?: [\040\t] |  \(
30  ------------------------------------------------------------------  (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
31          Bra  \)  )*                          # optional leading comment
32          \x{d55c}\x{ad6d}\x{c5b4}  (?:    (?:
33          Ket  [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
34          End  (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
35  ------------------------------------------------------------------  |
36    " (?:                      # opening quote...
37    [^\\\x80-\xff\n\015"]                #   Anything except backslash and quote
38    |                     #    or
39    \\ [^\x80-\xff]           #   Escaped something (something != CR)
40    )* "  # closing quote
41    )                    # initial word
42    (?:  (?: [\040\t] |  \(
43    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
44    \)  )*  \.  (?: [\040\t] |  \(
45    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
46    \)  )*   (?:
47    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
48    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
49    |
50    " (?:                      # opening quote...
51    [^\\\x80-\xff\n\015"]                #   Anything except backslash and quote
52    |                     #    or
53    \\ [^\x80-\xff]           #   Escaped something (something != CR)
54    )* "  # closing quote
55    )  )* # further okay, if led by a period
56    (?: [\040\t] |  \(
57    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
58    \)  )*  @  (?: [\040\t] |  \(
59    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
60    \)  )*    (?:
61    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
62    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
63    |   \[                         # [
64    (?: [^\\\x80-\xff\n\015\[\]] |  \\ [^\x80-\xff]  )*    #    stuff
65    \]                        #           ]
66    )                           # initial subdomain
67    (?:                                  #
68    (?: [\040\t] |  \(
69    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
70    \)  )*  \.                        # if led by a period...
71    (?: [\040\t] |  \(
72    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
73    \)  )*   (?:
74    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
75    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
76    |   \[                         # [
77    (?: [^\\\x80-\xff\n\015\[\]] |  \\ [^\x80-\xff]  )*    #    stuff
78    \]                        #           ]
79    )                     #   ...further okay
80    )*
81    # address
82    |                     #  or
83    (?:
84    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
85    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
86    |
87    " (?:                      # opening quote...
88    [^\\\x80-\xff\n\015"]                #   Anything except backslash and quote
89    |                     #    or
90    \\ [^\x80-\xff]           #   Escaped something (something != CR)
91    )* "  # closing quote
92    )             # one word, optionally followed by....
93    (?:
94    [^()<>@,;:".\\\[\]\x80-\xff\000-\010\012-\037]  |  # atom and space parts, or...
95    \(
96    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
97    \)       |  # comments, or...
98    
99    " (?:                      # opening quote...
100    [^\\\x80-\xff\n\015"]                #   Anything except backslash and quote
101    |                     #    or
102    \\ [^\x80-\xff]           #   Escaped something (something != CR)
103    )* "  # closing quote
104    # quoted strings
105    )*
106    <  (?: [\040\t] |  \(
107    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
108    \)  )*                     # leading <
109    (?:  @  (?: [\040\t] |  \(
110    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
111    \)  )*    (?:
112    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
113    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
114    |   \[                         # [
115    (?: [^\\\x80-\xff\n\015\[\]] |  \\ [^\x80-\xff]  )*    #    stuff
116    \]                        #           ]
117    )                           # initial subdomain
118    (?:                                  #
119    (?: [\040\t] |  \(
120    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
121    \)  )*  \.                        # if led by a period...
122    (?: [\040\t] |  \(
123    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
124    \)  )*   (?:
125    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
126    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
127    |   \[                         # [
128    (?: [^\\\x80-\xff\n\015\[\]] |  \\ [^\x80-\xff]  )*    #    stuff
129    \]                        #           ]
130    )                     #   ...further okay
131    )*
132    
133    (?:  (?: [\040\t] |  \(
134    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
135    \)  )*  ,  (?: [\040\t] |  \(
136    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
137    \)  )*  @  (?: [\040\t] |  \(
138    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
139    \)  )*    (?:
140    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
141    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
142    |   \[                         # [
143    (?: [^\\\x80-\xff\n\015\[\]] |  \\ [^\x80-\xff]  )*    #    stuff
144    \]                        #           ]
145    )                           # initial subdomain
146    (?:                                  #
147    (?: [\040\t] |  \(
148    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
149    \)  )*  \.                        # if led by a period...
150    (?: [\040\t] |  \(
151    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
152    \)  )*   (?:
153    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
154    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
155    |   \[                         # [
156    (?: [^\\\x80-\xff\n\015\[\]] |  \\ [^\x80-\xff]  )*    #    stuff
157    \]                        #           ]
158    )                     #   ...further okay
159    )*
160    )* # further okay, if led by comma
161    :                                # closing colon
162    (?: [\040\t] |  \(
163    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
164    \)  )*  )? #       optional route
165    (?:
166    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
167    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
168    |
169    " (?:                      # opening quote...
170    [^\\\x80-\xff\n\015"]                #   Anything except backslash and quote
171    |                     #    or
172    \\ [^\x80-\xff]           #   Escaped something (something != CR)
173    )* "  # closing quote
174    )                    # initial word
175    (?:  (?: [\040\t] |  \(
176    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
177    \)  )*  \.  (?: [\040\t] |  \(
178    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
179    \)  )*   (?:
180    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
181    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
182    |
183    " (?:                      # opening quote...
184    [^\\\x80-\xff\n\015"]                #   Anything except backslash and quote
185    |                     #    or
186    \\ [^\x80-\xff]           #   Escaped something (something != CR)
187    )* "  # closing quote
188    )  )* # further okay, if led by a period
189    (?: [\040\t] |  \(
190    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
191    \)  )*  @  (?: [\040\t] |  \(
192    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
193    \)  )*    (?:
194    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
195    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
196    |   \[                         # [
197    (?: [^\\\x80-\xff\n\015\[\]] |  \\ [^\x80-\xff]  )*    #    stuff
198    \]                        #           ]
199    )                           # initial subdomain
200    (?:                                  #
201    (?: [\040\t] |  \(
202    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
203    \)  )*  \.                        # if led by a period...
204    (?: [\040\t] |  \(
205    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
206    \)  )*   (?:
207    [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+    # some number of atom characters...
208    (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
209    |   \[                         # [
210    (?: [^\\\x80-\xff\n\015\[\]] |  \\ [^\x80-\xff]  )*    #    stuff
211    \]                        #           ]
212    )                     #   ...further okay
213    )*
214    #       address spec
215    (?: [\040\t] |  \(
216    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
217    \)  )*  > #                  trailing >
218    # name and address
219    )  (?: [\040\t] |  \(
220    (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  |  \( (?:  [^\\\x80-\xff\n\015()]  |  \\ [^\x80-\xff]  )* \)  )*
221    \)  )*                       # optional trailing comment
222    /xSI
223  Capturing subpattern count = 0  Capturing subpattern count = 0
224  Options: utf  Contains explicit CR or LF match
225  First char = \x{ed}  Options: extended
226  Need char = 180  No first char
227      \x{D55c}\x{ad6d}\x{C5B4}  No need char
228   0: \x{d55c}\x{ad6d}\x{c5b4}  Subject length lower bound = 3
229    Starting byte set: \x09 \x20 ! " # $ % & ' ( * + - / 0 1 2 3 4 5 6 7 8
230      9 = ? A B C D E F G H I J K L M N O P Q R S T U V W X Y Z ^ _ ` a b c d e
231      f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f \xff
232    
233  /\x{65e5}\x{672c}\x{8a9e}/DZ8  /[\h]/BZ
234  ------------------------------------------------------------------  ------------------------------------------------------------------
235          Bra          Bra
236          \x{65e5}\x{672c}\x{8a9e}          [\x09 \xa0\x{1680}\x{180e}\x{2000}-\x{200a}\x{202f}\x{205f}\x{3000}]
237          Ket          Ket
238          End          End
239  ------------------------------------------------------------------  ------------------------------------------------------------------
240  Capturing subpattern count = 0      >\x09<
241  Options: utf   0: \x09
 First char = \x{e6}  
 Need char = 158  
     \x{65e5}\x{672c}\x{8a9e}  
  0: \x{65e5}\x{672c}\x{8a9e}  
242    
243  /\x{80}/DZ8  /[\h]+/BZ
244  ------------------------------------------------------------------  ------------------------------------------------------------------
245          Bra          Bra
246          \x{80}          [\x09 \xa0\x{1680}\x{180e}\x{2000}-\x{200a}\x{202f}\x{205f}\x{3000}]++
247          Ket          Ket
248          End          End
249  ------------------------------------------------------------------  ------------------------------------------------------------------
250  Capturing subpattern count = 0      >\x09\x20\xa0<
251  Options: utf   0: \x09 \xa0
 First char = \x{c2}  
 Need char = 128  
252    
253  /\x{084}/DZ8  /[\v]/BZ
254  ------------------------------------------------------------------  ------------------------------------------------------------------
255          Bra          Bra
256          \x{84}          [\x0a-\x0d\x85\x{2028}-\x{2029}]
257          Ket          Ket
258          End          End
259  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{c2}  
 Need char = 132  
260    
261  /\x{104}/DZ8  /[^\h]/BZ
262  ------------------------------------------------------------------  ------------------------------------------------------------------
263          Bra          Bra
264          \x{104}          [^\x09 \xa0\x{1680}\x{180e}\x{2000}-\x{200a}\x{202f}\x{205f}\x{3000}]
265          Ket          Ket
266          End          End
267  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{c4}  
 Need char = 132  
268    
269  /\x{861}/DZ8  /\h+/SI
 ------------------------------------------------------------------  
         Bra  
         \x{861}  
         Ket  
         End  
 ------------------------------------------------------------------  
270  Capturing subpattern count = 0  Capturing subpattern count = 0
271  Options: utf  No options
272  First char = \x{e0}  No first char
273  Need char = 161  No need char
274    Subject length lower bound = 1
275    Starting byte set: \x09 \x20 \xa0 \xff
276        \x{1681}\x{200b}\x{1680}\x{2000}\x{202f}\x{3000}
277     0: \x{1680}\x{2000}\x{202f}\x{3000}
278        \x{3001}\x{2fff}\x{200a}\xa0\x{2000}
279     0: \x{200a}\xa0\x{2000}
280    
281  /\x{212ab}/DZ8  /[\h\x{dc00}]+/BZSI
282  ------------------------------------------------------------------  ------------------------------------------------------------------
283          Bra          Bra
284          \x{212ab}          [\x09 \xa0\x{1680}\x{180e}\x{2000}-\x{200a}\x{202f}\x{205f}\x{3000}\x{dc00}]++
285          Ket          Ket
286          End          End
287  ------------------------------------------------------------------  ------------------------------------------------------------------
288  Capturing subpattern count = 0  Capturing subpattern count = 0
289  Options: utf  No options
290  First char = \x{f0}  No first char
291  Need char = 171  No need char
292    Subject length lower bound = 1
293  /-- This one is here not because it's different to Perl, but because the way  No set of starting bytes
294  the captured single-byte is displayed. (In Perl it becomes a character, and you      \x{1681}\x{200b}\x{1680}\x{2000}\x{202f}\x{3000}
295  can't tell the difference.) --/   0: \x{1680}\x{2000}\x{202f}\x{3000}
296        \x{3001}\x{2fff}\x{200a}\xa0\x{2000}
297  /X(\C)(.*)/8   0: \x{200a}\xa0\x{2000}
     X\x{1234}  
  0: X\x{1234}  
  1: \x{e1}  
  2: \x{88}\x{b4}  
     X\nabc  
  0: X\x{0a}abc  
  1: \x{0a}  
  2: abc  
298    
299  /-- This one is here because Perl gives out a grumbly error message (quite  /\H+/SI
 correctly, but that messes up comparisons). --/  
   
 /a\Cb/8  
     *** Failers  
 No match  
     a\x{100}b  
 No match  
   
 /[^ab\xC0-\xF0]/8SDZ  
 ------------------------------------------------------------------  
         Bra  
         [\x00-`c-\xbf\xf1-\xff] (neg)  
         Ket  
         End  
 ------------------------------------------------------------------  
300  Capturing subpattern count = 0  Capturing subpattern count = 0
301  Options: utf  No options
302  No first char  No first char
303  No need char  No need char
304  Subject length lower bound = 1  Subject length lower bound = 1
 Starting byte set: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a  
   \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19  
   \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4  
   5 6 7 8 9 : ; < = > ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y  
   Z [ \ ] ^ _ ` c d e f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f  
   \xc2 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0  
   \xd1 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf  
   \xe0 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee  
   \xef \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd  
   \xfe \xff  
     \x{f1}  
  0: \x{f1}  
     \x{bf}  
  0: \x{bf}  
     \x{100}  
  0: \x{100}  
     \x{1000}  
  0: \x{1000}  
     *** Failers  
  0: *  
     \x{c0}  
 No match  
     \x{f0}  
 No match  
   
 /Ā{3,4}/8SDZ  
 ------------------------------------------------------------------  
         Bra  
         \x{100}{3}  
         \x{100}?  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{c4}  
 Need char = 128  
 Subject length lower bound = 3  
305  No set of starting bytes  No set of starting bytes
306    \x{100}\x{100}\x{100}\x{100\x{100}      \x{1680}\x{180e}\x{167f}\x{1681}\x{180d}\x{180f}
307   0: \x{100}\x{100}\x{100}   0: \x{167f}\x{1681}\x{180d}\x{180f}
308        \x{2000}\x{200a}\x{1fff}\x{200b}
309     0: \x{1fff}\x{200b}
310        \x{202f}\x{205f}\x{202e}\x{2030}\x{205e}\x{2060}
311     0: \x{202e}\x{2030}\x{205e}\x{2060}
312        \xa0\x{3000}\x9f\xa1\x{2fff}\x{3001}
313     0: \x9f\xa1\x{2fff}\x{3001}
314    
315    /[\H\x{d800}]+/
316        \x{1680}\x{180e}\x{167f}\x{1681}\x{180d}\x{180f}
317     0: \x{167f}\x{1681}\x{180d}\x{180f}
318        \x{2000}\x{200a}\x{1fff}\x{200b}
319     0: \x{1fff}\x{200b}
320        \x{202f}\x{205f}\x{202e}\x{2030}\x{205e}\x{2060}
321     0: \x{202e}\x{2030}\x{205e}\x{2060}
322        \xa0\x{3000}\x9f\xa1\x{2fff}\x{3001}
323     0: \x9f\xa1\x{2fff}\x{3001}
324    
325  /(\x{100}+|x)/8SDZ  /\v+/SI
326  ------------------------------------------------------------------  Capturing subpattern count = 0
327          Bra  No options
         CBra 1  
         \x{100}+  
         Alt  
         x  
         Ket  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 1  
 Options: utf  
328  No first char  No first char
329  No need char  No need char
330  Subject length lower bound = 1  Subject length lower bound = 1
331  Starting byte set: x \xc4  Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff
332        \x{2027}\x{2030}\x{2028}\x{2029}
333     0: \x{2028}\x{2029}
334        \x09\x0e\x84\x86\x85\x0a\x0b\x0c\x0d
335     0: \x85\x0a\x0b\x0c\x0d
336    
337  /(\x{100}*a|x)/8SDZ  /[\v\x{dc00}]+/BZSI
338  ------------------------------------------------------------------  ------------------------------------------------------------------
339          Bra          Bra
340          CBra 1          [\x0a-\x0d\x85\x{2028}-\x{2029}\x{dc00}]++
         \x{100}*+  
         a  
         Alt  
         x  
         Ket  
341          Ket          Ket
342          End          End
343  ------------------------------------------------------------------  ------------------------------------------------------------------
344  Capturing subpattern count = 1  Capturing subpattern count = 0
345  Options: utf  No options
346  No first char  No first char
347  No need char  No need char
348  Subject length lower bound = 1  Subject length lower bound = 1
349  Starting byte set: a x \xc4  No set of starting bytes
350        \x{2027}\x{2030}\x{2028}\x{2029}
351     0: \x{2028}\x{2029}
352        \x09\x0e\x84\x86\x85\x0a\x0b\x0c\x0d
353     0: \x85\x0a\x0b\x0c\x0d
354    
355  /(\x{100}{0,2}a|x)/8SDZ  /\V+/SI
356  ------------------------------------------------------------------  Capturing subpattern count = 0
357          Bra  No options
         CBra 1  
         \x{100}{0,2}  
         a  
         Alt  
         x  
         Ket  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 1  
 Options: utf  
358  No first char  No first char
359  No need char  No need char
360  Subject length lower bound = 1  Subject length lower bound = 1
361  Starting byte set: a x \xc4  No set of starting bytes
362        \x{2028}\x{2029}\x{2027}\x{2030}
363     0: \x{2027}\x{2030}
364        \x85\x0a\x0b\x0c\x0d\x09\x0e\x84\x86
365     0: \x09\x0e\x84\x86
366    
367  /(\x{100}{1,2}a|x)/8SDZ  /[\V\x{d800}]+/
368  ------------------------------------------------------------------      \x{2028}\x{2029}\x{2027}\x{2030}
369          Bra   0: \x{2027}\x{2030}
370          CBra 1      \x85\x0a\x0b\x0c\x0d\x09\x0e\x84\x86
371          \x{100}   0: \x09\x0e\x84\x86
372          \x{100}{0,1}  
373          a  /\R+/SI<bsr_unicode>
374          Alt  Capturing subpattern count = 0
375          x  Options: bsr_unicode
         Ket  
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 1  
 Options: utf  
376  No first char  No first char
377  No need char  No need char
378  Subject length lower bound = 1  Subject length lower bound = 1
379  Starting byte set: x \xc4  Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff
380        \x{2027}\x{2030}\x{2028}\x{2029}
381     0: \x{2028}\x{2029}
382        \x09\x0e\x84\x86\x85\x0a\x0b\x0c\x0d
383     0: \x85\x0a\x0b\x0c\x0d
384    
385  /\x{100}/8DZ  /\x{d800}\x{d7ff}\x{dc00}\x{dc00}\x{dcff}\x{dd00}/I
 ------------------------------------------------------------------  
         Bra  
         \x{100}  
         Ket  
         End  
 ------------------------------------------------------------------  
386  Capturing subpattern count = 0  Capturing subpattern count = 0
387  Options: utf  No options
388  First char = \x{c4}  First char = \x{d800}
389  Need char = 128  Need char = \x{dd00}
390        \x{d800}\x{d7ff}\x{dc00}\x{dc00}\x{dcff}\x{dd00}
391     0: \x{d800}\x{d7ff}\x{dc00}\x{dc00}\x{dcff}\x{dd00}
392    
393  /a\x{100}\x{101}*/8DZ  /[^\x{80}][^\x{ff}][^\x{100}][^\x{1000}][^\x{ffff}]/BZ
394  ------------------------------------------------------------------  ------------------------------------------------------------------
395          Bra          Bra
396          a\x{100}          [^\x80]
397          \x{101}*          [^\x{ff}]
398            [^\x{100}]
399            [^\x{1000}]
400            [^\x{ffff}]
401          Ket          Ket
402          End          End
403  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 0  
 Options: utf  
 First char = 'a'  
 Need char = 128  
404    
405  /a\x{100}\x{101}+/8DZ  /[^\x{80}][^\x{ff}][^\x{100}][^\x{1000}][^\x{ffff}]/BZi
406  ------------------------------------------------------------------  ------------------------------------------------------------------
407          Bra          Bra
408          a\x{100}       /i [^\x80]
409          \x{101}+       /i [^\x{ff}]
410         /i [^\x{100}]
411         /i [^\x{1000}]
412         /i [^\x{ffff}]
413          Ket          Ket
414          End          End
415  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 0  
 Options: utf  
 First char = 'a'  
 Need char = 129  
416    
417  /[^\x{c4}]/DZ  /[^\x{100}]*[^\x{1000}]+[^\x{ffff}]??[^\x{8000}]{4,}[^\x{7fff}]{2,9}?[^\x{100}]{5,6}+/BZ
418  ------------------------------------------------------------------  ------------------------------------------------------------------
419          Bra          Bra
420          [^\xc4]          [^\x{100}]*
421            [^\x{1000}]+
422            [^\x{ffff}]??
423            [^\x{8000}]{4}
424            [^\x{8000}]*
425            [^\x{7fff}]{2}
426            [^\x{7fff}]{0,7}?
427            [^\x{100}]{5}
428            [^\x{100}]?+
429          Ket          Ket
430          End          End
431  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 0  
 No options  
 No first char  
 No need char  
432    
433  /[\x{100}]/8DZ  /[^\x{100}]*[^\x{1000}]+[^\x{ffff}]??[^\x{8000}]{4,}[^\x{7fff}]{2,9}?[^\x{100}]{5,6}+/BZi
434  ------------------------------------------------------------------  ------------------------------------------------------------------
435          Bra          Bra
436          \x{100}       /i [^\x{100}]*
437         /i [^\x{1000}]+
438         /i [^\x{ffff}]??
439         /i [^\x{8000}]{4}
440         /i [^\x{8000}]*
441         /i [^\x{7fff}]{2}
442         /i [^\x{7fff}]{0,7}?
443         /i [^\x{100}]{5}
444         /i [^\x{100}]?+
445          Ket          Ket
446          End          End
447  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{c4}  
 Need char = 128  
     \x{100}  
  0: \x{100}  
     Z\x{100}  
  0: \x{100}  
     \x{100}Z  
  0: \x{100}  
     *** Failers  
 No match  
448    
449  /[\xff]/DZ8  /(*:0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF)XX/K
450        XX
451     0: XX
452    MK: 0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF
453    
454    /(*:0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDE)XX/K
455        XX
456     0: XX
457    MK: 0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDEF0123456789ABCDE
458    
459    /\u0100/<JS>BZ
460  ------------------------------------------------------------------  ------------------------------------------------------------------
461          Bra          Bra
462          \x{ff}          \x{100}
463          Ket          Ket
464          End          End
465  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{c3}  
 Need char = 191  
     >\x{ff}<  
  0: \x{ff}  
466    
467  /[^\xff]/8DZ  /[\u0100-\u0200]/<JS>BZ
468  ------------------------------------------------------------------  ------------------------------------------------------------------
469          Bra          Bra
470          [\x00-\xfe] (neg)          [\x{100}-\x{200}]
471          Ket          Ket
472          End          End
473  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 0  
 Options: utf  
 No first char  
 No need char  
474    
475  /\x{100}abc(xyz(?1))/8DZ  /\ud800/<JS>BZ
476  ------------------------------------------------------------------  ------------------------------------------------------------------
477          Bra          Bra
478          \x{100}abc          \x{d800}
         CBra 1  
         xyz  
         Recurse  
         Ket  
479          Ket          Ket
480          End          End
481  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 1  
 Options: utf  
 First char = \x{c4}  
 Need char = 'z'  
482    
483  /a\x{1234}b/P8  /^\x{ffff}+/i
484      a\x{1234}b      \x{ffff}
485   0: a\x{1234}b   0: \x{ffff}
486    
487  /\777/8I  /^\x{ffff}?/i
488  Capturing subpattern count = 0      \x{ffff}
489  Options: utf   0: \x{ffff}
490  First char = \x{c7}  
491  Need char = 191  /^\x{ffff}*/i
492    \x{1ff}      \x{ffff}
493   0: \x{1ff}   0: \x{ffff}
494    \777  
495   0: \x{1ff}  /^\x{ffff}{3}/i
496        \x{ffff}\x{ffff}\x{ffff}
497  /\x{100}+\x{200}/8DZ   0: \x{ffff}\x{ffff}\x{ffff}
498  ------------------------------------------------------------------  
499          Bra  /^\x{ffff}{0,3}/i
500          \x{100}++      \x{ffff}
501          \x{200}   0: \x{ffff}
         Ket  
         End  
 ------------------------------------------------------------------  
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{c4}  
 Need char = 128  
502    
503  /\x{100}+X/8DZ  /[^\x00-a]{12,}[^b-\xff]*/BZ
504  ------------------------------------------------------------------  ------------------------------------------------------------------
505          Bra          Bra
506          \x{100}++          [b-\xff] (neg){12,}
507          X          [\x00-a] (neg)*+
508          Ket          Ket
509          End          End
510  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 0  
 Options: utf  
 First char = \x{c4}  
 Need char = 'X'  
   
 /^[\QĀ\E-\QŐ\E/BZ8  
 Failed: missing terminating ] for character class at offset 15  
   
 /-- This tests the stricter UTF-8 check according to RFC 3629. --/  
   
 /X/8  
     \x{0}\x{d7ff}\x{e000}\x{10ffff}  
 No match  
     \x{d800}  
 Error -10 (bad UTF-8 string) offset=0 reason=14  
     \x{d800}\?  
 No match  
     \x{da00}  
 Error -10 (bad UTF-8 string) offset=0 reason=14  
     \x{da00}\?  
 No match  
     \x{dfff}  
 Error -10 (bad UTF-8 string) offset=0 reason=14  
     \x{dfff}\?  
 No match  
     \x{110000}  
 Error -10 (bad UTF-8 string) offset=0 reason=13  
     \x{110000}\?  
 No match  
     \x{2000000}  
 Error -10 (bad UTF-8 string) offset=0 reason=11  
     \x{2000000}\?  
 No match  
     \x{7fffffff}  
 Error -10 (bad UTF-8 string) offset=0 reason=12  
     \x{7fffffff}\?  
 No match  
511    
512  /(*UTF8)\x{1234}/  /[^\s]*\s* [^\W]+\W+ [^\d]*?\d0 [^\d\w]{4,6}?\w*A/BZ
   abcd\x{1234}pqr  
  0: \x{1234}  
   
 /(*CRLF)(*UTF8)(*BSR_UNICODE)a\Rb/I  
 Capturing subpattern count = 0  
 Options: bsr_unicode utf  
 Forced newline sequence: CRLF  
 First char = 'a'  
 Need char = 'b'  
   
 /\h/SI8  
 Capturing subpattern count = 0  
 Options: utf  
 No first char  
 No need char  
 Subject length lower bound = 1  
 Starting byte set: \x09 \x20 \xc2 \xe1 \xe2 \xe3  
     ABC\x{09}  
  0: \x{09}  
     ABC\x{20}  
  0:  
     ABC\x{a0}  
  0: \x{a0}  
     ABC\x{1680}  
  0: \x{1680}  
     ABC\x{180e}  
  0: \x{180e}  
     ABC\x{2000}  
  0: \x{2000}  
     ABC\x{202f}  
  0: \x{202f}  
     ABC\x{205f}  
  0: \x{205f}  
     ABC\x{3000}  
  0: \x{3000}  
   
 /\v/SI8  
 Capturing subpattern count = 0  
 Options: utf  
 No first char  
 No need char  
 Subject length lower bound = 1  
 Starting byte set: \x0a \x0b \x0c \x0d \xc2 \xe2  
     ABC\x{0a}  
  0: \x{0a}  
     ABC\x{0b}  
  0: \x{0b}  
     ABC\x{0c}  
  0: \x{0c}  
     ABC\x{0d}  
  0: \x{0d}  
     ABC\x{85}  
  0: \x{85}  
     ABC\x{2028}  
  0: \x{2028}  
   
 /\h*A/SI8  
 Capturing subpattern count = 0  
 Options: utf  
 No first char  
 Need char = 'A'  
 Subject length lower bound = 1  
 Starting byte set: \x09 \x20 A \xc2 \xe1 \xe2 \xe3  
     CDBABC  
  0: A  
   
 /\v+A/SI8  
 Capturing subpattern count = 0  
 Options: utf  
 No first char  
 Need char = 'A'  
 Subject length lower bound = 2  
 Starting byte set: \x0a \x0b \x0c \x0d \xc2 \xe2  
   
 /\s?xxx\s/8SI  
 Capturing subpattern count = 0  
 Options: utf  
 No first char  
 Need char = 'x'  
 Subject length lower bound = 4  
 Starting byte set: \x09 \x0a \x0c \x0d \x20 x  
   
 /\sxxx\s/I8ST1  
 Capturing subpattern count = 0  
 Options: utf  
 No first char  
 Need char = 'x'  
 Subject length lower bound = 5  
 Starting byte set: \x09 \x0a \x0c \x0d \x20 \xc2  
     AB\x{85}xxx\x{a0}XYZ  
  0: \x{85}xxx\x{a0}  
     AB\x{a0}xxx\x{85}XYZ  
  0: \x{a0}xxx\x{85}  
   
 /\S \S/I8ST1  
 Capturing subpattern count = 0  
 Options: utf  
 No first char  
 Need char = ' '  
 Subject length lower bound = 3  
 Starting byte set: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x0b \x0e  
   \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 \x1a \x1b \x1c \x1d  
   \x1e \x1f ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 5 6 7 8 9 : ; < = > ? @  
   A B C D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c d e  
   f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f \xc0 \xc1 \xc2 \xc3  
   \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 \xd1 \xd2  
   \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf \xe0 \xe1  
   \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee \xef \xf0  
   \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd \xfe \xff  
     \x{a2} \x{84}  
  0: \x{a2} \x{84}  
     A Z  
  0: A Z  
   
 /a+/8  
     a\x{123}aa\>1  
  0: aa  
     a\x{123}aa\>2  
 Error -11 (bad UTF-8 offset)  
     a\x{123}aa\>3  
  0: aa  
     a\x{123}aa\>4  
  0: a  
     a\x{123}aa\>5  
 No match  
     a\x{123}aa\>6  
 Error -24 (bad offset value)  
   
 /\x{1234}+/iS8I  
 Capturing subpattern count = 0  
 Options: caseless utf  
 No first char  
 No need char  
 Subject length lower bound = 1  
 Starting byte set: \xe1  
   
 /\x{1234}+?/iS8I  
 Capturing subpattern count = 0  
 Options: caseless utf  
 No first char  
 No need char  
 Subject length lower bound = 1  
 Starting byte set: \xe1  
   
 /\x{1234}++/iS8I  
 Capturing subpattern count = 0  
 Options: caseless utf  
 No first char  
 No need char  
 Subject length lower bound = 1  
 Starting byte set: \xe1  
   
 /\x{1234}{2}/iS8I  
 Capturing subpattern count = 0  
 Options: caseless utf  
 No first char  
 No need char  
 Subject length lower bound = 2  
 Starting byte set: \xe1  
   
 /[^\x{c4}]/8DZ  
513  ------------------------------------------------------------------  ------------------------------------------------------------------
514          Bra          Bra
515          [\x00-\xc3\xc5-\xff] (neg)          [\x00-\x08\x0e-\x1f!-\xff] (neg)*
516            \s*
517    
518            [0-9A-Z_a-z]++
519            \W+
520    
521            [\x00-/:-\xff] (neg)*?
522            \d
523            0
524            [\x00-/:-@[-^`{-\xff] (neg){4,6}?
525            \w*
526            A
527          Ket          Ket
528          End          End
529  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 0  
 Options: utf  
 No first char  
 No need char  
530    
531  /X+\x{200}/8DZ  /a*[b-\x{200}]?a#a*[b-\x{200}]?b#[a-f]*[g-\x{200}]*#[g-\x{200}]*[a-c]*#[g-\x{200}]*[a-h]*/BZ
532  ------------------------------------------------------------------  ------------------------------------------------------------------
533          Bra          Bra
534          X++          a*
535          \x{200}          [b-\x{200}]?+
536            a#
537            a*+
538            [b-\x{200}]?
539            b#
540            [a-f]*
541            [g-\x{200}]*+
542            #
543            [g-\x{200}]*
544            [a-c]*+
545            #
546            [g-\x{200}]*
547            [a-h]*+
548          Ket          Ket
549          End          End
550  ------------------------------------------------------------------  ------------------------------------------------------------------
 Capturing subpattern count = 0  
 Options: utf  
 First char = 'X'  
 Need char = 128  
   
 /\R/SI8  
 Capturing subpattern count = 0  
 Options: utf  
 No first char  
 No need char  
 Subject length lower bound = 1  
 Starting byte set: \x0a \x0b \x0c \x0d \xc2 \xe2  
551    
552  /-- End of testinput17 --/  /-- End of testinput17 --/

Legend:
Removed from v.810  
changed lines
  Added in v.1382

  ViewVC Help
Powered by ViewVC 1.1.5