| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
package App::Sets::Parser; |
|
2
|
|
|
|
|
|
|
$App::Sets::Parser::VERSION = '0.978'; |
|
3
|
|
|
|
|
|
|
|
|
4
|
|
|
|
|
|
|
|
|
5
|
3
|
|
|
3
|
|
22
|
use strict; |
|
|
3
|
|
|
|
|
8
|
|
|
|
3
|
|
|
|
|
97
|
|
|
6
|
3
|
|
|
3
|
|
17
|
use warnings; |
|
|
3
|
|
|
|
|
5
|
|
|
|
3
|
|
|
|
|
96
|
|
|
7
|
3
|
|
|
3
|
|
16
|
use Carp; |
|
|
3
|
|
|
|
|
5
|
|
|
|
3
|
|
|
|
|
195
|
|
|
8
|
3
|
|
|
3
|
|
19
|
use Log::Log4perl::Tiny qw< :easy :dead_if_first >; |
|
|
3
|
|
|
|
|
7
|
|
|
|
3
|
|
|
|
|
19
|
|
|
9
|
|
|
|
|
|
|
|
|
10
|
|
|
|
|
|
|
# ABSTRACT: parse input expressions of operations on sets |
|
11
|
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
|
|
13
|
|
|
|
|
|
|
sub parse { |
|
14
|
64
|
|
|
64
|
0
|
174
|
my ($string) = @_; |
|
15
|
64
|
|
|
|
|
179
|
my $retval = first($string, 0); |
|
16
|
64
|
50
|
|
|
|
182
|
my ($expression, $pos) = $retval ? @$retval : (undef, 0); |
|
17
|
64
|
50
|
|
|
|
283
|
return $expression if $pos == length $string; |
|
18
|
|
|
|
|
|
|
|
|
19
|
0
|
|
|
|
|
0
|
my $offending = substr $string, $pos; |
|
20
|
|
|
|
|
|
|
|
|
21
|
0
|
|
|
|
|
0
|
my ($spaces) = $offending =~ s{\A(\s+)}{}mxs; |
|
22
|
0
|
|
|
|
|
0
|
$pos += length $spaces; |
|
23
|
|
|
|
|
|
|
|
|
24
|
0
|
|
|
|
|
0
|
my $nchars = 23; |
|
25
|
0
|
0
|
|
|
|
0
|
$offending = substr($offending, 0, $nchars - 3) . '...' |
|
26
|
|
|
|
|
|
|
if length($offending) > $nchars; |
|
27
|
|
|
|
|
|
|
|
|
28
|
0
|
|
|
|
|
0
|
LOGDIE "parse error at char $pos --> $offending\n",; |
|
29
|
|
|
|
|
|
|
} ## end sub parse |
|
30
|
|
|
|
|
|
|
|
|
31
|
|
|
|
|
|
|
sub lrx_head { |
|
32
|
252
|
|
|
252
|
0
|
661
|
my $sequence = _sequence(@_); |
|
33
|
|
|
|
|
|
|
return sub { |
|
34
|
252
|
50
|
|
252
|
|
663
|
my $retval = $sequence->(@_) |
|
35
|
|
|
|
|
|
|
or return; |
|
36
|
252
|
|
|
|
|
460
|
my ($struct, $pos) = @$retval; |
|
37
|
252
|
|
|
|
|
393
|
my ($second, $first_tail) = @{$struct}[1, 3]; |
|
|
252
|
|
|
|
|
520
|
|
|
38
|
252
|
100
|
|
|
|
517
|
if (defined $first_tail->[0]) { |
|
39
|
64
|
|
|
|
|
95
|
my ($root, $parent) = @{$first_tail->[0]}; |
|
|
64
|
|
|
|
|
142
|
|
|
40
|
64
|
|
|
|
|
104
|
$parent->[1] = $second->[0]; |
|
41
|
64
|
|
|
|
|
159
|
$struct = $root; |
|
42
|
|
|
|
|
|
|
} |
|
43
|
|
|
|
|
|
|
else { |
|
44
|
188
|
|
|
|
|
275
|
$struct = $second->[0]; |
|
45
|
|
|
|
|
|
|
} |
|
46
|
252
|
|
|
|
|
1806
|
return [$struct, $pos]; |
|
47
|
|
|
|
|
|
|
} |
|
48
|
252
|
|
|
|
|
1383
|
} ## end sub lrx_head |
|
49
|
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
sub lrx_tail { |
|
51
|
316
|
|
|
316
|
0
|
699
|
my $sequence = _sequence('optws', _alternation(_sequence(@_), 'empty')); |
|
52
|
|
|
|
|
|
|
return sub { |
|
53
|
316
|
50
|
|
316
|
|
592
|
my $retval = $sequence->(@_) |
|
54
|
|
|
|
|
|
|
or return; |
|
55
|
316
|
|
|
|
|
593
|
my ($struct, $pos) = @$retval; |
|
56
|
316
|
|
|
|
|
506
|
$retval = $struct->[1]; |
|
57
|
316
|
100
|
|
|
|
770
|
if (!defined $retval->[0]) { |
|
58
|
252
|
|
|
|
|
406
|
$retval = undef; |
|
59
|
|
|
|
|
|
|
} |
|
60
|
|
|
|
|
|
|
else { # not empty |
|
61
|
64
|
|
|
|
|
116
|
my ($op, $second, $tail) = @{$retval->[0]}[0, 2, 4]; |
|
|
64
|
|
|
|
|
208
|
|
|
62
|
64
|
|
|
|
|
146
|
my $node = [$op->[0], undef, $second->[0]]; |
|
63
|
64
|
50
|
|
|
|
120
|
if (defined $tail->[0]) { |
|
64
|
0
|
|
|
|
|
0
|
my ($root, $parent) = @{$tail->[0]}; |
|
|
0
|
|
|
|
|
0
|
|
|
65
|
0
|
|
|
|
|
0
|
$parent->[1] = $node; # link leaf to parent node |
|
66
|
0
|
|
|
|
|
0
|
$retval = [$root, $node]; |
|
67
|
|
|
|
|
|
|
} |
|
68
|
|
|
|
|
|
|
else { |
|
69
|
64
|
|
|
|
|
139
|
$retval = [$node, $node]; |
|
70
|
|
|
|
|
|
|
} |
|
71
|
|
|
|
|
|
|
} ## end else [ if (!defined $retval->... |
|
72
|
316
|
|
|
|
|
3560
|
return [$retval, $pos]; |
|
73
|
|
|
|
|
|
|
} |
|
74
|
316
|
|
|
|
|
1732
|
} ## end sub lrx_tail |
|
75
|
|
|
|
|
|
|
|
|
76
|
|
|
|
|
|
|
sub first { |
|
77
|
64
|
|
|
64
|
0
|
210
|
return lrx_head(qw< optws second optws first_tail optws >)->(@_); |
|
78
|
|
|
|
|
|
|
} |
|
79
|
|
|
|
|
|
|
|
|
80
|
|
|
|
|
|
|
sub first_tail { |
|
81
|
80
|
|
|
80
|
0
|
437
|
return lrx_tail(qw< op_subtract optws second optws first_tail optws >) |
|
82
|
|
|
|
|
|
|
->(@_); |
|
83
|
|
|
|
|
|
|
} |
|
84
|
|
|
|
|
|
|
|
|
85
|
|
|
|
|
|
|
sub second { |
|
86
|
80
|
|
|
80
|
0
|
229
|
return lrx_head(qw< optws third optws second_tail optws >)->(@_); |
|
87
|
|
|
|
|
|
|
} |
|
88
|
|
|
|
|
|
|
|
|
89
|
|
|
|
|
|
|
sub second_tail { |
|
90
|
108
|
|
|
108
|
0
|
246
|
return lrx_tail(qw< op_union optws third optws second_tail optws >) |
|
91
|
|
|
|
|
|
|
->(@_); |
|
92
|
|
|
|
|
|
|
} |
|
93
|
|
|
|
|
|
|
|
|
94
|
|
|
|
|
|
|
sub third { |
|
95
|
108
|
|
|
108
|
0
|
351
|
return lrx_head(qw< optws fourth optws third_tail optws >)->(@_); |
|
96
|
|
|
|
|
|
|
} |
|
97
|
|
|
|
|
|
|
|
|
98
|
|
|
|
|
|
|
sub third_tail { |
|
99
|
128
|
|
|
128
|
0
|
356
|
return lrx_tail(qw< op_intersect optws fourth optws third_tail optws >) |
|
100
|
|
|
|
|
|
|
->(@_); |
|
101
|
|
|
|
|
|
|
} |
|
102
|
|
|
|
|
|
|
|
|
103
|
|
|
|
|
|
|
sub fourth { |
|
104
|
128
|
50
|
|
128
|
0
|
401
|
my $retval = _sequence( |
|
105
|
|
|
|
|
|
|
'optws', |
|
106
|
|
|
|
|
|
|
_alternation( |
|
107
|
|
|
|
|
|
|
_sequence(_string('('), qw< optws first optws >, _string(')')), |
|
108
|
|
|
|
|
|
|
'filename', |
|
109
|
|
|
|
|
|
|
), |
|
110
|
|
|
|
|
|
|
'optws' |
|
111
|
|
|
|
|
|
|
)->(@_) |
|
112
|
|
|
|
|
|
|
or return; |
|
113
|
128
|
|
|
|
|
1358
|
my ($struct, $pos) = @$retval; |
|
114
|
128
|
|
|
|
|
230
|
my $meat = $struct->[1]; |
|
115
|
128
|
50
|
|
|
|
275
|
if (ref($meat->[0])) { |
|
116
|
0
|
|
|
|
|
0
|
$retval = $meat->[0][2][0]; |
|
117
|
|
|
|
|
|
|
} |
|
118
|
|
|
|
|
|
|
else { |
|
119
|
128
|
|
|
|
|
207
|
$retval = $meat->[0]; |
|
120
|
|
|
|
|
|
|
} |
|
121
|
128
|
|
|
|
|
519
|
return [$retval, $pos]; |
|
122
|
|
|
|
|
|
|
} ## end sub fourth |
|
123
|
|
|
|
|
|
|
|
|
124
|
|
|
|
|
|
|
sub _op { |
|
125
|
316
|
|
|
316
|
|
1102
|
my ($regex, $retval, $string, $pos) = @_; |
|
126
|
316
|
|
|
|
|
627
|
pos($string) = $pos; |
|
127
|
316
|
100
|
|
|
|
11151
|
return unless $string =~ m{\G($regex)}cgmxs; |
|
128
|
64
|
|
|
|
|
378
|
return [$retval, pos($string)]; |
|
129
|
|
|
|
|
|
|
} ## end sub _op |
|
130
|
|
|
|
|
|
|
|
|
131
|
|
|
|
|
|
|
sub op_intersect { |
|
132
|
128
|
|
|
128
|
0
|
948
|
return _op(qr{(?:intersect|[iI&^])}, 'intersect', @_); |
|
133
|
|
|
|
|
|
|
} |
|
134
|
|
|
|
|
|
|
|
|
135
|
|
|
|
|
|
|
sub op_union { |
|
136
|
108
|
|
|
108
|
0
|
424
|
return _op(qr{(?:union|[uUvV|+])}, 'union', @_); |
|
137
|
|
|
|
|
|
|
} |
|
138
|
|
|
|
|
|
|
|
|
139
|
|
|
|
|
|
|
sub op_subtract { |
|
140
|
80
|
|
|
80
|
0
|
274
|
return _op(qr{(?:minus|less|[\\-])}, 'minus', @_); |
|
141
|
|
|
|
|
|
|
} |
|
142
|
|
|
|
|
|
|
|
|
143
|
|
|
|
|
|
|
sub filename { |
|
144
|
128
|
|
|
128
|
0
|
258
|
my ($string, $pos) = @_; |
|
145
|
128
|
|
|
|
|
594
|
DEBUG "filename() >$string< $pos"; |
|
146
|
128
|
|
|
|
|
2306
|
pos($string) = $pos; |
|
147
|
128
|
|
|
|
|
220
|
my $retval; |
|
148
|
128
|
50
|
|
|
|
2022
|
if (($retval) = $string =~ m{\G ' ( [^']+ ) '}cgmxs) { |
|
|
|
50
|
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
149
|
0
|
|
|
|
|
0
|
return [$retval, pos($string)]; |
|
150
|
|
|
|
|
|
|
} |
|
151
|
|
|
|
|
|
|
elsif (($retval) = $string =~ m{\G " ( (?: \\. | [^"])+ ) "}cgmxs) { |
|
152
|
0
|
|
|
|
|
0
|
$retval =~ s{\\(.)}{$1}gmxs; |
|
153
|
0
|
|
|
|
|
0
|
return [$retval, pos($string)]; |
|
154
|
|
|
|
|
|
|
} |
|
155
|
|
|
|
|
|
|
elsif (($retval) = $string =~ m{\G ( (?: \\. | [\w.-/])+ )}cgmxs) { |
|
156
|
128
|
|
|
|
|
851
|
$retval =~ s{\\(.)}{$1}gmxs; |
|
157
|
128
|
|
|
|
|
557
|
return [$retval, pos($string)]; |
|
158
|
|
|
|
|
|
|
} |
|
159
|
0
|
|
|
|
|
0
|
return; |
|
160
|
|
|
|
|
|
|
} ## end sub filename |
|
161
|
|
|
|
|
|
|
|
|
162
|
|
|
|
|
|
|
sub empty { |
|
163
|
252
|
|
|
252
|
0
|
525
|
my ($string, $pos) = @_; |
|
164
|
252
|
|
|
|
|
698
|
return [undef, $pos]; |
|
165
|
|
|
|
|
|
|
} |
|
166
|
|
|
|
|
|
|
|
|
167
|
|
|
|
|
|
|
sub is_empty { |
|
168
|
0
|
|
|
0
|
0
|
0
|
my ($struct) = @_; |
|
169
|
0
|
|
|
|
|
0
|
return @{$struct->[0]} > 0; |
|
|
0
|
|
|
|
|
0
|
|
|
170
|
|
|
|
|
|
|
} |
|
171
|
|
|
|
|
|
|
|
|
172
|
|
|
|
|
|
|
sub ws { |
|
173
|
0
|
|
|
0
|
0
|
0
|
my ($string, $pos) = @_; |
|
174
|
0
|
|
|
|
|
0
|
pos($string) = $pos; |
|
175
|
0
|
0
|
|
|
|
0
|
my ($retval) = $string =~ m{\G (\s+)}cgmxs |
|
176
|
|
|
|
|
|
|
or return; |
|
177
|
0
|
|
|
|
|
0
|
return [$retval, pos($string)]; |
|
178
|
|
|
|
|
|
|
} ## end sub ws |
|
179
|
|
|
|
|
|
|
|
|
180
|
|
|
|
|
|
|
sub optws { |
|
181
|
1520
|
|
|
1520
|
0
|
2536
|
my ($string, $pos) = @_; |
|
182
|
1520
|
|
|
|
|
3065
|
pos($string) = $pos; |
|
183
|
1520
|
|
|
|
|
6950
|
my ($retval) = $string =~ m{\G (\s*)}cgmxs; |
|
184
|
1520
|
|
100
|
|
|
5684
|
$retval = [$retval || '', pos($string)]; |
|
185
|
1520
|
|
|
|
|
3896
|
return $retval; |
|
186
|
|
|
|
|
|
|
} ## end sub optws |
|
187
|
|
|
|
|
|
|
|
|
188
|
|
|
|
|
|
|
sub _string { |
|
189
|
256
|
|
|
256
|
|
737
|
my ($target) = @_; |
|
190
|
256
|
|
|
|
|
428
|
my $len = length $target; |
|
191
|
|
|
|
|
|
|
return sub { |
|
192
|
128
|
|
|
128
|
|
251
|
my ($string, $pos) = @_; |
|
193
|
128
|
50
|
|
|
|
731
|
return unless substr($string, $pos, $len) eq $target; |
|
194
|
0
|
|
|
|
|
0
|
return [$target, $pos + $len]; |
|
195
|
|
|
|
|
|
|
} |
|
196
|
256
|
|
|
|
|
1204
|
} ## end sub _string |
|
197
|
|
|
|
|
|
|
|
|
198
|
|
|
|
|
|
|
sub _alternation { |
|
199
|
444
|
|
|
444
|
|
857
|
my @subs = _resolve(@_); |
|
200
|
|
|
|
|
|
|
return sub { |
|
201
|
444
|
|
|
444
|
|
743
|
my ($string, $pos) = @_; |
|
202
|
444
|
|
|
|
|
692
|
for my $sub (@subs) { |
|
203
|
824
|
|
100
|
|
|
1788
|
my $retval = $sub->($string, $pos) || next; |
|
204
|
444
|
|
|
|
|
1148
|
return $retval; |
|
205
|
|
|
|
|
|
|
} |
|
206
|
0
|
|
|
|
|
0
|
return; |
|
207
|
444
|
|
|
|
|
1829
|
}; |
|
208
|
|
|
|
|
|
|
} ## end sub _alternation |
|
209
|
|
|
|
|
|
|
|
|
210
|
|
|
|
|
|
|
sub _sequence { |
|
211
|
1140
|
|
|
1140
|
|
2002
|
my @subs = _resolve(@_); |
|
212
|
|
|
|
|
|
|
return sub { |
|
213
|
1140
|
|
|
1140
|
|
1936
|
my ($string, $pos) = @_; |
|
214
|
1140
|
|
|
|
|
1423
|
my @chunks; |
|
215
|
1140
|
|
|
|
|
1704
|
for my $sub (@subs) { |
|
216
|
3040
|
100
|
|
|
|
5810
|
my $chunk = $sub->($string, $pos) |
|
217
|
|
|
|
|
|
|
or return; |
|
218
|
2660
|
|
|
|
|
4538
|
push @chunks, $chunk; |
|
219
|
2660
|
|
|
|
|
4517
|
$pos = $chunk->[1]; |
|
220
|
|
|
|
|
|
|
} ## end for my $sub (@subs) |
|
221
|
760
|
|
|
|
|
2080
|
return [\@chunks, $pos]; |
|
222
|
1140
|
|
|
|
|
4829
|
}; |
|
223
|
|
|
|
|
|
|
} ## end sub _sequence |
|
224
|
|
|
|
|
|
|
|
|
225
|
|
|
|
|
|
|
sub _resolve { |
|
226
|
|
|
|
|
|
|
return |
|
227
|
1584
|
100
|
33
|
1584
|
|
2289
|
map { ref $_ ? $_ : __PACKAGE__->can($_) || LOGDIE "unknown $_" } @_; |
|
|
5700
|
|
|
|
|
18702
|
|
|
228
|
|
|
|
|
|
|
} |
|
229
|
|
|
|
|
|
|
|
|
230
|
|
|
|
|
|
|
1; |
|
231
|
|
|
|
|
|
|
|
|
232
|
|
|
|
|
|
|
__END__ |