/[pcre]/code/trunk/testdata/testoutput17
ViewVC logotype

Contents of /code/trunk/testdata/testoutput17

Parent Directory | Revision Log


Revision 827 - (hide annotations) (download)
Tue Dec 27 10:51:09 2011 UTC (2 years, 10 months ago) by ph10
Original Path: code/branches/pcre16/testdata/testoutput17
File size: 13901 byte(s)
Update pcretest for non-UTF 16-bit wide values, for testing table-lookups 
better. Add tests for bad mode.

1 ph10 814 /-- This set of tests is for the 16-bit library's basic (non-UTF-16) features
2 ph10 823 that are not compatible with the 8-bit library, or which give different
3     output in 16-bit mode. --/
4 ph10 810
5     /a\Cb/
6     aXb
7     0: aXb
8     a\nb
9     0: a\x0ab
10    
11 ph10 814 /-- Check maximum non-UTF character size --/
12 ph10 810
13 ph10 814 /\x{ffff}/
14     A\x{ffff}B
15 ph10 827 0: \x{ffff}
16 ph10 810
17 ph10 814 /\x{10000}/
18     Failed: character value in \x{...} sequence is too large at offset 8
19 ph10 810
20     /[^\x{c4}]/DZ
21     ------------------------------------------------------------------
22     Bra
23     [^\xc4]
24     Ket
25     End
26     ------------------------------------------------------------------
27     Capturing subpattern count = 0
28     No options
29     No first char
30     No need char
31    
32 ph10 818
33     /\x{100}/I
34     Capturing subpattern count = 0
35     No options
36     First char = \x{100}
37     No need char
38    
39     / (?: [\040\t] | \(
40     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
41     \) )* # optional leading comment
42     (?: (?:
43     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
44     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
45     |
46     " (?: # opening quote...
47     [^\\\x80-\xff\n\015"] # Anything except backslash and quote
48     | # or
49     \\ [^\x80-\xff] # Escaped something (something != CR)
50     )* " # closing quote
51     ) # initial word
52     (?: (?: [\040\t] | \(
53     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
54     \) )* \. (?: [\040\t] | \(
55     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
56     \) )* (?:
57     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
58     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
59     |
60     " (?: # opening quote...
61     [^\\\x80-\xff\n\015"] # Anything except backslash and quote
62     | # or
63     \\ [^\x80-\xff] # Escaped something (something != CR)
64     )* " # closing quote
65     ) )* # further okay, if led by a period
66     (?: [\040\t] | \(
67     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
68     \) )* @ (?: [\040\t] | \(
69     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
70     \) )* (?:
71     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
72     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
73     | \[ # [
74     (?: [^\\\x80-\xff\n\015\[\]] | \\ [^\x80-\xff] )* # stuff
75     \] # ]
76     ) # initial subdomain
77     (?: #
78     (?: [\040\t] | \(
79     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
80     \) )* \. # if led by a period...
81     (?: [\040\t] | \(
82     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
83     \) )* (?:
84     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
85     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
86     | \[ # [
87     (?: [^\\\x80-\xff\n\015\[\]] | \\ [^\x80-\xff] )* # stuff
88     \] # ]
89     ) # ...further okay
90     )*
91     # address
92     | # or
93     (?:
94     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
95     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
96     |
97     " (?: # opening quote...
98     [^\\\x80-\xff\n\015"] # Anything except backslash and quote
99     | # or
100     \\ [^\x80-\xff] # Escaped something (something != CR)
101     )* " # closing quote
102     ) # one word, optionally followed by....
103     (?:
104     [^()<>@,;:".\\\[\]\x80-\xff\000-\010\012-\037] | # atom and space parts, or...
105     \(
106     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
107     \) | # comments, or...
108    
109     " (?: # opening quote...
110     [^\\\x80-\xff\n\015"] # Anything except backslash and quote
111     | # or
112     \\ [^\x80-\xff] # Escaped something (something != CR)
113     )* " # closing quote
114     # quoted strings
115     )*
116     < (?: [\040\t] | \(
117     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
118     \) )* # leading <
119     (?: @ (?: [\040\t] | \(
120     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
121     \) )* (?:
122     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
123     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
124     | \[ # [
125     (?: [^\\\x80-\xff\n\015\[\]] | \\ [^\x80-\xff] )* # stuff
126     \] # ]
127     ) # initial subdomain
128     (?: #
129     (?: [\040\t] | \(
130     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
131     \) )* \. # if led by a period...
132     (?: [\040\t] | \(
133     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
134     \) )* (?:
135     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
136     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
137     | \[ # [
138     (?: [^\\\x80-\xff\n\015\[\]] | \\ [^\x80-\xff] )* # stuff
139     \] # ]
140     ) # ...further okay
141     )*
142    
143     (?: (?: [\040\t] | \(
144     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
145     \) )* , (?: [\040\t] | \(
146     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
147     \) )* @ (?: [\040\t] | \(
148     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
149     \) )* (?:
150     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
151     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
152     | \[ # [
153     (?: [^\\\x80-\xff\n\015\[\]] | \\ [^\x80-\xff] )* # stuff
154     \] # ]
155     ) # initial subdomain
156     (?: #
157     (?: [\040\t] | \(
158     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
159     \) )* \. # if led by a period...
160     (?: [\040\t] | \(
161     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
162     \) )* (?:
163     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
164     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
165     | \[ # [
166     (?: [^\\\x80-\xff\n\015\[\]] | \\ [^\x80-\xff] )* # stuff
167     \] # ]
168     ) # ...further okay
169     )*
170     )* # further okay, if led by comma
171     : # closing colon
172     (?: [\040\t] | \(
173     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
174     \) )* )? # optional route
175     (?:
176     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
177     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
178     |
179     " (?: # opening quote...
180     [^\\\x80-\xff\n\015"] # Anything except backslash and quote
181     | # or
182     \\ [^\x80-\xff] # Escaped something (something != CR)
183     )* " # closing quote
184     ) # initial word
185     (?: (?: [\040\t] | \(
186     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
187     \) )* \. (?: [\040\t] | \(
188     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
189     \) )* (?:
190     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
191     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
192     |
193     " (?: # opening quote...
194     [^\\\x80-\xff\n\015"] # Anything except backslash and quote
195     | # or
196     \\ [^\x80-\xff] # Escaped something (something != CR)
197     )* " # closing quote
198     ) )* # further okay, if led by a period
199     (?: [\040\t] | \(
200     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
201     \) )* @ (?: [\040\t] | \(
202     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
203     \) )* (?:
204     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
205     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
206     | \[ # [
207     (?: [^\\\x80-\xff\n\015\[\]] | \\ [^\x80-\xff] )* # stuff
208     \] # ]
209     ) # initial subdomain
210     (?: #
211     (?: [\040\t] | \(
212     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
213     \) )* \. # if led by a period...
214     (?: [\040\t] | \(
215     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
216     \) )* (?:
217     [^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]+ # some number of atom characters...
218     (?![^(\040)<>@,;:".\\\[\]\000-\037\x80-\xff]) # ..not followed by something that could be part of an atom
219     | \[ # [
220     (?: [^\\\x80-\xff\n\015\[\]] | \\ [^\x80-\xff] )* # stuff
221     \] # ]
222     ) # ...further okay
223     )*
224     # address spec
225     (?: [\040\t] | \(
226     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
227     \) )* > # trailing >
228     # name and address
229     ) (?: [\040\t] | \(
230     (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] | \( (?: [^\\\x80-\xff\n\015()] | \\ [^\x80-\xff] )* \) )*
231     \) )* # optional trailing comment
232     /xSI
233     Capturing subpattern count = 0
234     Contains explicit CR or LF match
235     Options: extended
236     No first char
237     No need char
238     Subject length lower bound = 3
239     Starting byte set: \x09 \x20 ! " # $ % & ' ( * + - / 0 1 2 3 4 5 6 7 8
240     9 = ? A B C D E F G H I J K L M N O P Q R S T U V W X Y Z ^ _ ` a b c d e
241     f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f \xff
242    
243 ph10 827 <testdata/saved8
244     Compiled pattern loaded from testdata/saved8
245     No study data
246     Error -28 from pcre16_fullinfo(0)
247     Running in 16-bit mode but pattern was compiled in 8-bit mode
248    
249 zherczeg 825 /\h/SI
250     Capturing subpattern count = 0
251     No options
252     No first char
253     No need char
254     Subject length lower bound = 1
255     Starting byte set: \x09 \x20 \xa0 \xff
256    
257     /\v/SI
258     Capturing subpattern count = 0
259     No options
260     No first char
261     No need char
262     Subject length lower bound = 1
263     Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff
264    
265     /\R/SI
266     Capturing subpattern count = 0
267     No options
268     No first char
269     No need char
270     Subject length lower bound = 1
271     Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff
272    
273 zherczeg 826 /[\h]/BZ
274     ------------------------------------------------------------------
275     Bra
276     [\x09 \xa0\x{1680}\x{180e}\x{2000}-\x{200a}\x{202f}\x{205f}\x{3000}]
277     Ket
278     End
279     ------------------------------------------------------------------
280     >\x09<
281     0: \x09
282    
283     /[\h]+/BZ
284     ------------------------------------------------------------------
285     Bra
286     [\x09 \xa0\x{1680}\x{180e}\x{2000}-\x{200a}\x{202f}\x{205f}\x{3000}]+
287     Ket
288     End
289     ------------------------------------------------------------------
290     >\x09\x20\xa0<
291     0: \x09 \xa0
292    
293     /[\v]/BZ
294     ------------------------------------------------------------------
295     Bra
296     [\x0a-\x0d\x85\x{2028}-\x{2029}]
297     Ket
298     End
299     ------------------------------------------------------------------
300    
301     /[\H]/BZ
302     ------------------------------------------------------------------
303     Bra
304     [\x00-\x08\x0a-\x1f!-\x9f\xa1-\xff\x{100}-\x{167f}\x{1681}-\x{180d}\x{180f}-\x{1fff}\x{200b}-\x{202e}\x{2030}-\x{205e}\x{2060}-\x{2fff}\x{3001}-\x{ffff}]
305     Ket
306     End
307     ------------------------------------------------------------------
308    
309     /[^\h]/BZ
310     ------------------------------------------------------------------
311     Bra
312     [^\x09 \xa0\x{1680}\x{180e}\x{2000}-\x{200a}\x{202f}\x{205f}\x{3000}]
313     Ket
314     End
315     ------------------------------------------------------------------
316    
317     /[\V]/BZ
318     ------------------------------------------------------------------
319     Bra
320     [\x00-\x09\x0e-\x84\x86-\xff\x{100}-\x{2027}\x{202a}-\x{ffff}]
321     Ket
322     End
323     ------------------------------------------------------------------
324    
325     /[\x0a\V]/BZ
326     ------------------------------------------------------------------
327     Bra
328     [\x00-\x0a\x0e-\x84\x86-\xff\x{100}-\x{2027}\x{202a}-\x{ffff}]
329     Ket
330     End
331     ------------------------------------------------------------------
332    
333 ph10 810 /-- End of testinput17 --/

webmaster@exim.org
ViewVC Help
Powered by ViewVC 1.1.12