1#!./perl
2
3BEGIN {
4    require Config;
5    if (($Config::Config{'extensions'} !~ /\bre\b/) ){
6	print "1..0 # Skip -- Perl configured without re module\n";
7	exit 0;
8    }
9}
10
11use strict;
12BEGIN { require "../../t/test.pl"; }
13our $NUM_SECTS;
14chomp(my @strs= grep { !/^\s*\#/ } <DATA>);
15my $out = runperl(progfile => "t/regop.pl", stderr => 1 );
16# VMS currently embeds linefeeds in the output.
17$out =~ s/\cJ//g if $^O eq 'VMS';
18my @tests = grep { /\S/ } split /(?=Compiling REx)/, $out;
19# on debug builds we get an EXECUTING... message in there at the top
20shift @tests
21    if $tests[0] =~ /EXECUTING.../;
22
23plan( @tests + 2 + ( @strs - grep { !$_ or /^---/ } @strs ));
24
25is( scalar @tests, $NUM_SECTS,
26    "Expecting output for $NUM_SECTS patterns, got ". scalar(@tests) );
27ok( defined $out, 'regop.pl returned something defined' );
28
29$out ||= "";
30my $test= 1;
31foreach my $testout ( @tests ) {
32    my ( $pattern )= $testout=~/Compiling REx "([^"]+)"/;
33    ok( $pattern, "Pattern for test " . ($test++) );
34    my $diaged;
35    while (@strs) {
36        local $_= shift @strs;
37        last if !$_
38             or /^---/;
39        next if /^\s*#/;
40        s/^\s+//;
41        s/\s+$//;
42        ok( $testout=~/\Q$_\E/, "$_: /$pattern/" )
43            or do {
44                !$diaged++ and diag("PATTERN: /$pattern/\n\n"
45		    . "EXPECTED:\n$_\n\n"
46		    . "WITHIN GOT:\n$testout");
47            };
48    }
49}
50
51# The format below is simple. Each line is an exact
52# string that must be found in the output.
53# Lines starting the # are comments.
54# Lines starting with --- are separators indicating
55# that the tests for this result set are finished.
56# If you add a test make sure you update $NUM_SECTS
57# the commented output is just for legacy/debugging purposes
58BEGIN{ $NUM_SECTS= 8 }
59
60__END__
61#Compiling REx "X(A|[B]Q||C|D)Y"
62#size 34
63#first at 1
64#   1: EXACT <X>(3)
65#   3: OPEN1(5)
66#   5:   TRIE-EXACT(21)
67#        [Words:5 Chars:5 Unique:5 States:6 Start-Class:A-D]
68#          <A>
69#          <BQ>
70#          <>
71#          <C>
72#          <D>
73#  21: CLOSE1(23)
74#  23: EXACT <Y>(25)
75#  25: END(0)
76#anchored "X" at 0 floating "Y" at 1..3 (checking floating) minlen 2
77#Guessing start of match, REx "X(A|[B]Q||C|D)Y" against "XY"...
78#Found floating substr "Y" at offset 1...
79#Found anchored substr "X" at offset 0...
80#Guessed: match at offset 0
81#Matching REx "X(A|[B]Q||C|D)Y" against "XY"
82#  Setting an EVAL scope, savestack=140
83#   0 <> <XY>              |  1:  EXACT <X>
84#   1 <X> <Y>              |  3:  OPEN1
85#   1 <X> <Y>              |  5:  TRIE-EXACT
86#                                 matched empty string...
87#   1 <X> <Y>              | 21:  CLOSE1
88#   1 <X> <Y>              | 23:  EXACT <Y>
89#   2 <XY> <>              | 25:  END
90#Match successful!
91#%MATCHED%
92#Freeing REx: "X(A|[B]Q||C|D)Y"
93Compiling REx "X(A|[B]Q||C|D)Y"
94[A-D]
95TRIE-EXACT
96<BQ>
97matched empty string
98Match successful!
99Found floating substr "Y" at offset 1 (rx_origin now 0)...
100Found anchored substr "X" at offset 0 (rx_origin now 0)...
101Successfully guessed: match at offset 0
102checking floating
103minlen 2
104S:1/6
105W:5
106L:0/2
107C:5/5
108%MATCHED%
109---
110#Compiling REx "[f][o][o][b][a][r]"
111#size 67
112#first at 1
113#   1: EXACT <foobar>(13)
114#  13: END(0)
115#anchored "foobar" at 0 (checking anchored isall) minlen 6
116#Guessing start of match, REx "[f][o][o][b][a][r]" against "foobar"...
117#Found anchored substr "foobar" at offset 0...
118#Guessed: match at offset 0
119#Freeing REx: "[f][o][o][b][a][r]"
120foobar
121checking anchored isall
122minlen 6
123anchored "foobar" at 0
124Successfully guessed: match at offset 0
125Compiling REx "[f][o][o][b][a][r]"
126Freeing REx: "[f][o][o][b][a][r]"
127%MATCHED%
128---
129#Compiling REx ".[XY]."
130#size 14
131#first at 1
132#   1: REG_ANY(2)
133#   2: ANYOF[XY](13)
134#  13: REG_ANY(14)
135#  14: END(0)
136#minlen 3
137#%FAILED%
138#Freeing REx: ".[XY]."
139%FAILED%
140minlen 3
141---
142# Compiling REx "(?:ABCP|ABCG|ABCE|ABCB|ABCA|ABCD)"
143# Got 164 bytes for offset annotations.
144#     TRIE(NATIVE): W:6 C:24 Uq:7 Min:4 Max:4
145#       Char : Match Base  Ofs     A   B   C   P   G   E   D
146#       State|---------------------------------------------------
147#       #   1|       @   7 + 0[    2   .   .   .   .   .   .]
148#       #   2|       @   7 + 1[    .   3   .   .   .   .   .]
149#       #   3|       @   7 + 2[    .   .   4   .   .   .   .]
150#       #   4|       @   A + 0[    9   8   0   5   6   7   A]
151#       #   5| W   1 @   0
152#       #   6| W   2 @   0
153#       #   7| W   3 @   0
154#       #   8| W   4 @   0
155#       #   9| W   5 @   0
156#       #   A| W   6 @   0
157#     word_info N:(prev,char)= 1:(0,1) 2:(0,1) 3:(0,1) 4:(0,1) 5:(0,1) 6:(0,1)
158# Final program:
159#    1: EXACT <ABC> (3)
160#    3: TRIEC-EXACT<S:4/10 W:6 L:1/1 C:24/7>[A-EGP] (20)
161#       <P>
162#       <G>
163#       <E>
164#       <B>
165#       <A>
166#       <D>
167#   20: END (0)
168# anchored "ABC" at 0 (checking anchored) minlen 4
169# Offsets: [20]
170# 	1:4[3] 3:4[15] 19:32[0] 20:34[0]
171# Guessing start of match in sv for REx "(?:ABCP|ABCG|ABCE|ABCB|ABCA|ABCD)" against "ABCD"
172# Found anchored substr "ABC" at offset 0...
173# Guessed: match at offset 0
174# Matching REx "(?:ABCP|ABCG|ABCE|ABCB|ABCA|ABCD)" against "ABCD"
175#    0 <> <ABCD>               |  1:EXACT <ABC>(3)
176#    3 <ABC> <D>               |  3:TRIEC-EXACT<S:4/10 W:6 L:1/1 C:24/7>[A-EGP](20)
177#    3 <ABC> <D>               |    State:    4 Accepted:    0 Charid:  7 CP:  44 After State:    a
178#    4 <ABCD> <>               |    State:    a Accepted:    1 Charid:  7 CP:   0 After State:    0
179#                                   got 1 possible matches
180#                                   TRIE matched word #6, continuing
181#    4 <ABCD> <>               | 20:  END(0)
182# Match successful!
183# %MATCHED%
184# Freeing REx: "(?:ABCP|ABCG|ABCE|ABCB|ABCA|ABCD)"
185%MATCHED%
186EXACT <ABC>
187TRIEC-EXACT
188[A-EGP]
189S:4/10
190W:6
191L:1/1
192C:24/7
193minlen 4
194(checking anchored)
195anchored "ABC" at 0
196---
197#Compiling REx "(\.COM|\.EXE|\.BAT|\.CMD|\.VBS|\.VBE|\.JS|\.JSE|\.WSF|\.WSH|\.pyo|\.pyc|\.pyw|\.py)$"
198#size 48 nodes first at 3
199#first at 3
200#rarest char
201# at 0
202#   1: OPEN1(3)
203#   3:   EXACTF <.>(5)
204#   5:   TRIE-EXACTF(45)
205#        [Start:2 Words:14 Chars:54 Unique:18 States:29 Minlen:2 Maxlen:3 Start-Class:BCEJPVWbcejpvw]
206#          <.COM>
207#          ...  yada yada ... (dmq)
208#          <.py>
209#  45: CLOSE1(47)
210#  47: EOL(48)
211#  48: END(0)
212#floating ""$ at 3..4 (checking floating) stclass "EXACTF <.>" minlen 3
213#Offsets: [48]
214#        1:1[1] 3:2[1] 5:2[81] 45:83[1] 47:84[1] 48:85[0]
215#Guessing start of match, REx "(\.COM|\.EXE|\.BAT|\.CMD|\.VBS|\.VBE|\.JS|\.JSE|\.WSF|\.WSH|..." against "D:dev/perl/ver/28321_/perl.exe"...
216#Found floating substr ""$ at offset 30...
217#Starting position does not contradict /^/m...
218#Does not contradict STCLASS...
219#Guessed: match at offset 26
220#Matching REx "(\.COM|\.EXE|\.BAT|\.CMD|\.VBS|\.VBE|\.JS|\.JSE|\.WSF|\.WSH|\.pyo|\.pyc|\.pyw|\.py)$..." against ".exe"
221#Matching stclass "EXACTF <.>" against ".exe"
222#  Setting an EVAL scope, savestack=140
223#  26 <21_/perl> <.exe>    |  1:  OPEN1
224#  26 <21_/perl> <.exe>    |  3:  EXACTF <.>
225#  27 <21_/perl.> <exe>    |  5:  TRIE-EXACTF
226#                                 only one match : #2 <.EXE>
227#  30 <21_/perl.exe> <>    | 45:    CLOSE1
228#  30 <21_/perl.exe> <>    | 47:    EOL
229#  30 <21_/perl.exe> <>    | 48:    END
230#Match successful!
231#POP STATE(1)
232#%MATCHED%
233#Freeing REx: "(\\.COM|\\.EXE|\\.BAT|\\.CMD|\\.VBS|\\.VBE|\\.JS|\\.JSE|\\."......
234%MATCHED%
235floating ""$ at 3..4 (checking floating)
236#1:1[1] 3:2[1] 5:2[64] 45:83[1] 47:84[1] 48:85[0]
237#stclass EXACTF <.> minlen 3
238#Found floating substr ""$ at offset 30...
239#Does not contradict STCLASS...
240#Guessed: match at offset 26
241#Matching stclass EXACTF <.> against ".exe"
242---
243#Compiling REx "[q]"
244#size 3 nodes Got 7 bytes for offset annotations.
245#first at 1
246#Final program:
247#   1: EXACT <q>(3)
248#   3: END(0)
249#anchored "q" at 0 (checking anchored isall) minlen 1
250#Offsets: [3]
251#        1:1[3] 3:4[0]
252#Guessing start of match, REx "[q]" against "q"...
253#Found anchored substr "q" at offset 0...
254#Guessed: match at offset 0
255#%MATCHED%
256#Freeing REx: "[q]"
257Got 7 bytes for offset annotations.
258Offsets: [3]
2591:1[3] 3:4[0]
260%MATCHED%
261Freeing REx: "[q]"
262---
263#Compiling REx "^(\S{1,9}):\s*(\d+)$"
264#Final program:
265#   1: SBOL (2)
266#   2: OPEN1 (4)
267#   4:   CURLY {1,9} (7)
268#   6:     NPOSIXD[\s] (0)
269#   7: CLOSE1 (9)
270#   9: EXACT <:> (11)
271#  11: STAR (13)
272#  12:   POSIXD[\s] (0)
273#  13: OPEN2 (15)
274#  15:   PLUS (17)
275#  16:     POSIXD[\d] (0)
276#  17: CLOSE2 (19)
277#  19: EOL (20)
278#  20: END (0)
279#Freeing REx: "^(\S{1,9}):\s*(\d+)$"
280%MATCHED%
281Freeing REx: "^(\S{1,9}):\s*(\d+)$"
282---
283#Compiling REx "(?(DEFINE)(?<foo>foo))(?(DEFINE)(?<bar>(?&foo)bar))(?(DEFINE"...
284#Got 532 bytes for offset annotations.
285study_chunk_recursed_count: 5
286#Final program:
287#   1: DEFINEP (3)
288#   3: IFTHEN (14)
289#   5:   OPEN1 'foo' (7)
290#   7:     EXACT <foo> (9)
291#   9:   CLOSE1 'foo' (14)
292#  11:   LONGJMP (13)
293#  13:   TAIL (14)
294#  14: DEFINEP (16)
295#  16: IFTHEN (30)
296#  18:   OPEN2 'bar' (20)
297#  20:     GOSUB1[-15] (23)
298#  23:     EXACT <bar> (25)
299#  25:   CLOSE2 'bar' (30)
300#  27:   LONGJMP (29)
301#  29:   TAIL (30)
302#  30: DEFINEP (32)
303#  32: IFTHEN (46)
304#  34:   OPEN3 'baz' (36)
305#  36:     GOSUB2[-18] (39)
306#  39:     EXACT <baz> (41)
307#  41:   CLOSE3 'baz' (46)
308#  43:   LONGJMP (45)
309#  45:   TAIL (46)
310#  46: DEFINEP (48)
311#  48: IFTHEN (62)
312#  50:   OPEN4 'bop' (52)
313#  52:     GOSUB3[-18] (55)
314#  55:     EXACT <bop> (57)
315#  57:   CLOSE4 'bop' (62)
316#  59:   LONGJMP (61)
317#  61:   TAIL (62)
318#  62: END (0)
319minlen 0
320#Offsets: [66]
321#        1:3[0] 3:10[0] 5:17[1] 7:18[3] 9:21[1] 11:21[0] 13:22[0] 14:25[0] 16:32[0] 18:39[1] 20:41[3] 23:47[3] 25:50[1] 27:50[0] 29:51[0] 30:54[0] 32:61[0] 34:68[1] 36:70[3] 39:76[3] 41:79[1] 43:79[0] 45:80[0] 46:83[0] 48:90[0] 50:97[1] 52:99[3] 55:105[3] 57:108[1] 59:108[0] 61:109[0] 62:110[0]
322#Matching REx "(?(DEFINE)(?<foo>foo))(?(DEFINE)(?<bar>(?&foo)bar))(?(DEFINE"... against ""
323#   0 <> <>                   |  1:DEFINEP(3)
324#   0 <> <>                   |  3:IFTHEN(14)
325#   0 <> <>                   | 14:DEFINEP(16)
326#   0 <> <>                   | 16:IFTHEN(30)
327#   0 <> <>                   | 30:DEFINEP(32)
328#   0 <> <>                   | 32:IFTHEN(46)
329#   0 <> <>                   | 46:DEFINEP(48)
330#   0 <> <>                   | 48:IFTHEN(62)
331#   0 <> <>                   | 62:END(0)
332#Match successful!
333%MATCHED%
334#Freeing REx: "(?(DEFINE)(?<foo>foo))(?(DEFINE)(?<bar>(?&foo)bar))(?(DEFINE"...
335