line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package App::Sets::Parser; |
2
|
|
|
|
|
|
|
$App::Sets::Parser::VERSION = '0.978'; |
3
|
|
|
|
|
|
|
|
4
|
|
|
|
|
|
|
|
5
|
3
|
|
|
3
|
|
22
|
use strict; |
|
3
|
|
|
|
|
8
|
|
|
3
|
|
|
|
|
97
|
|
6
|
3
|
|
|
3
|
|
17
|
use warnings; |
|
3
|
|
|
|
|
5
|
|
|
3
|
|
|
|
|
96
|
|
7
|
3
|
|
|
3
|
|
16
|
use Carp; |
|
3
|
|
|
|
|
5
|
|
|
3
|
|
|
|
|
195
|
|
8
|
3
|
|
|
3
|
|
19
|
use Log::Log4perl::Tiny qw< :easy :dead_if_first >; |
|
3
|
|
|
|
|
7
|
|
|
3
|
|
|
|
|
19
|
|
9
|
|
|
|
|
|
|
|
10
|
|
|
|
|
|
|
# ABSTRACT: parse input expressions of operations on sets |
11
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
|
13
|
|
|
|
|
|
|
sub parse { |
14
|
64
|
|
|
64
|
0
|
174
|
my ($string) = @_; |
15
|
64
|
|
|
|
|
179
|
my $retval = first($string, 0); |
16
|
64
|
50
|
|
|
|
182
|
my ($expression, $pos) = $retval ? @$retval : (undef, 0); |
17
|
64
|
50
|
|
|
|
283
|
return $expression if $pos == length $string; |
18
|
|
|
|
|
|
|
|
19
|
0
|
|
|
|
|
0
|
my $offending = substr $string, $pos; |
20
|
|
|
|
|
|
|
|
21
|
0
|
|
|
|
|
0
|
my ($spaces) = $offending =~ s{\A(\s+)}{}mxs; |
22
|
0
|
|
|
|
|
0
|
$pos += length $spaces; |
23
|
|
|
|
|
|
|
|
24
|
0
|
|
|
|
|
0
|
my $nchars = 23; |
25
|
0
|
0
|
|
|
|
0
|
$offending = substr($offending, 0, $nchars - 3) . '...' |
26
|
|
|
|
|
|
|
if length($offending) > $nchars; |
27
|
|
|
|
|
|
|
|
28
|
0
|
|
|
|
|
0
|
LOGDIE "parse error at char $pos --> $offending\n",; |
29
|
|
|
|
|
|
|
} ## end sub parse |
30
|
|
|
|
|
|
|
|
31
|
|
|
|
|
|
|
sub lrx_head { |
32
|
252
|
|
|
252
|
0
|
661
|
my $sequence = _sequence(@_); |
33
|
|
|
|
|
|
|
return sub { |
34
|
252
|
50
|
|
252
|
|
663
|
my $retval = $sequence->(@_) |
35
|
|
|
|
|
|
|
or return; |
36
|
252
|
|
|
|
|
460
|
my ($struct, $pos) = @$retval; |
37
|
252
|
|
|
|
|
393
|
my ($second, $first_tail) = @{$struct}[1, 3]; |
|
252
|
|
|
|
|
520
|
|
38
|
252
|
100
|
|
|
|
517
|
if (defined $first_tail->[0]) { |
39
|
64
|
|
|
|
|
95
|
my ($root, $parent) = @{$first_tail->[0]}; |
|
64
|
|
|
|
|
142
|
|
40
|
64
|
|
|
|
|
104
|
$parent->[1] = $second->[0]; |
41
|
64
|
|
|
|
|
159
|
$struct = $root; |
42
|
|
|
|
|
|
|
} |
43
|
|
|
|
|
|
|
else { |
44
|
188
|
|
|
|
|
275
|
$struct = $second->[0]; |
45
|
|
|
|
|
|
|
} |
46
|
252
|
|
|
|
|
1806
|
return [$struct, $pos]; |
47
|
|
|
|
|
|
|
} |
48
|
252
|
|
|
|
|
1383
|
} ## end sub lrx_head |
49
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
sub lrx_tail { |
51
|
316
|
|
|
316
|
0
|
699
|
my $sequence = _sequence('optws', _alternation(_sequence(@_), 'empty')); |
52
|
|
|
|
|
|
|
return sub { |
53
|
316
|
50
|
|
316
|
|
592
|
my $retval = $sequence->(@_) |
54
|
|
|
|
|
|
|
or return; |
55
|
316
|
|
|
|
|
593
|
my ($struct, $pos) = @$retval; |
56
|
316
|
|
|
|
|
506
|
$retval = $struct->[1]; |
57
|
316
|
100
|
|
|
|
770
|
if (!defined $retval->[0]) { |
58
|
252
|
|
|
|
|
406
|
$retval = undef; |
59
|
|
|
|
|
|
|
} |
60
|
|
|
|
|
|
|
else { # not empty |
61
|
64
|
|
|
|
|
116
|
my ($op, $second, $tail) = @{$retval->[0]}[0, 2, 4]; |
|
64
|
|
|
|
|
208
|
|
62
|
64
|
|
|
|
|
146
|
my $node = [$op->[0], undef, $second->[0]]; |
63
|
64
|
50
|
|
|
|
120
|
if (defined $tail->[0]) { |
64
|
0
|
|
|
|
|
0
|
my ($root, $parent) = @{$tail->[0]}; |
|
0
|
|
|
|
|
0
|
|
65
|
0
|
|
|
|
|
0
|
$parent->[1] = $node; # link leaf to parent node |
66
|
0
|
|
|
|
|
0
|
$retval = [$root, $node]; |
67
|
|
|
|
|
|
|
} |
68
|
|
|
|
|
|
|
else { |
69
|
64
|
|
|
|
|
139
|
$retval = [$node, $node]; |
70
|
|
|
|
|
|
|
} |
71
|
|
|
|
|
|
|
} ## end else [ if (!defined $retval->... |
72
|
316
|
|
|
|
|
3560
|
return [$retval, $pos]; |
73
|
|
|
|
|
|
|
} |
74
|
316
|
|
|
|
|
1732
|
} ## end sub lrx_tail |
75
|
|
|
|
|
|
|
|
76
|
|
|
|
|
|
|
sub first { |
77
|
64
|
|
|
64
|
0
|
210
|
return lrx_head(qw< optws second optws first_tail optws >)->(@_); |
78
|
|
|
|
|
|
|
} |
79
|
|
|
|
|
|
|
|
80
|
|
|
|
|
|
|
sub first_tail { |
81
|
80
|
|
|
80
|
0
|
437
|
return lrx_tail(qw< op_subtract optws second optws first_tail optws >) |
82
|
|
|
|
|
|
|
->(@_); |
83
|
|
|
|
|
|
|
} |
84
|
|
|
|
|
|
|
|
85
|
|
|
|
|
|
|
sub second { |
86
|
80
|
|
|
80
|
0
|
229
|
return lrx_head(qw< optws third optws second_tail optws >)->(@_); |
87
|
|
|
|
|
|
|
} |
88
|
|
|
|
|
|
|
|
89
|
|
|
|
|
|
|
sub second_tail { |
90
|
108
|
|
|
108
|
0
|
246
|
return lrx_tail(qw< op_union optws third optws second_tail optws >) |
91
|
|
|
|
|
|
|
->(@_); |
92
|
|
|
|
|
|
|
} |
93
|
|
|
|
|
|
|
|
94
|
|
|
|
|
|
|
sub third { |
95
|
108
|
|
|
108
|
0
|
351
|
return lrx_head(qw< optws fourth optws third_tail optws >)->(@_); |
96
|
|
|
|
|
|
|
} |
97
|
|
|
|
|
|
|
|
98
|
|
|
|
|
|
|
sub third_tail { |
99
|
128
|
|
|
128
|
0
|
356
|
return lrx_tail(qw< op_intersect optws fourth optws third_tail optws >) |
100
|
|
|
|
|
|
|
->(@_); |
101
|
|
|
|
|
|
|
} |
102
|
|
|
|
|
|
|
|
103
|
|
|
|
|
|
|
sub fourth { |
104
|
128
|
50
|
|
128
|
0
|
401
|
my $retval = _sequence( |
105
|
|
|
|
|
|
|
'optws', |
106
|
|
|
|
|
|
|
_alternation( |
107
|
|
|
|
|
|
|
_sequence(_string('('), qw< optws first optws >, _string(')')), |
108
|
|
|
|
|
|
|
'filename', |
109
|
|
|
|
|
|
|
), |
110
|
|
|
|
|
|
|
'optws' |
111
|
|
|
|
|
|
|
)->(@_) |
112
|
|
|
|
|
|
|
or return; |
113
|
128
|
|
|
|
|
1358
|
my ($struct, $pos) = @$retval; |
114
|
128
|
|
|
|
|
230
|
my $meat = $struct->[1]; |
115
|
128
|
50
|
|
|
|
275
|
if (ref($meat->[0])) { |
116
|
0
|
|
|
|
|
0
|
$retval = $meat->[0][2][0]; |
117
|
|
|
|
|
|
|
} |
118
|
|
|
|
|
|
|
else { |
119
|
128
|
|
|
|
|
207
|
$retval = $meat->[0]; |
120
|
|
|
|
|
|
|
} |
121
|
128
|
|
|
|
|
519
|
return [$retval, $pos]; |
122
|
|
|
|
|
|
|
} ## end sub fourth |
123
|
|
|
|
|
|
|
|
124
|
|
|
|
|
|
|
sub _op { |
125
|
316
|
|
|
316
|
|
1102
|
my ($regex, $retval, $string, $pos) = @_; |
126
|
316
|
|
|
|
|
627
|
pos($string) = $pos; |
127
|
316
|
100
|
|
|
|
11151
|
return unless $string =~ m{\G($regex)}cgmxs; |
128
|
64
|
|
|
|
|
378
|
return [$retval, pos($string)]; |
129
|
|
|
|
|
|
|
} ## end sub _op |
130
|
|
|
|
|
|
|
|
131
|
|
|
|
|
|
|
sub op_intersect { |
132
|
128
|
|
|
128
|
0
|
948
|
return _op(qr{(?:intersect|[iI&^])}, 'intersect', @_); |
133
|
|
|
|
|
|
|
} |
134
|
|
|
|
|
|
|
|
135
|
|
|
|
|
|
|
sub op_union { |
136
|
108
|
|
|
108
|
0
|
424
|
return _op(qr{(?:union|[uUvV|+])}, 'union', @_); |
137
|
|
|
|
|
|
|
} |
138
|
|
|
|
|
|
|
|
139
|
|
|
|
|
|
|
sub op_subtract { |
140
|
80
|
|
|
80
|
0
|
274
|
return _op(qr{(?:minus|less|[\\-])}, 'minus', @_); |
141
|
|
|
|
|
|
|
} |
142
|
|
|
|
|
|
|
|
143
|
|
|
|
|
|
|
sub filename { |
144
|
128
|
|
|
128
|
0
|
258
|
my ($string, $pos) = @_; |
145
|
128
|
|
|
|
|
594
|
DEBUG "filename() >$string< $pos"; |
146
|
128
|
|
|
|
|
2306
|
pos($string) = $pos; |
147
|
128
|
|
|
|
|
220
|
my $retval; |
148
|
128
|
50
|
|
|
|
2022
|
if (($retval) = $string =~ m{\G ' ( [^']+ ) '}cgmxs) { |
|
|
50
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
149
|
0
|
|
|
|
|
0
|
return [$retval, pos($string)]; |
150
|
|
|
|
|
|
|
} |
151
|
|
|
|
|
|
|
elsif (($retval) = $string =~ m{\G " ( (?: \\. | [^"])+ ) "}cgmxs) { |
152
|
0
|
|
|
|
|
0
|
$retval =~ s{\\(.)}{$1}gmxs; |
153
|
0
|
|
|
|
|
0
|
return [$retval, pos($string)]; |
154
|
|
|
|
|
|
|
} |
155
|
|
|
|
|
|
|
elsif (($retval) = $string =~ m{\G ( (?: \\. | [\w.-/])+ )}cgmxs) { |
156
|
128
|
|
|
|
|
851
|
$retval =~ s{\\(.)}{$1}gmxs; |
157
|
128
|
|
|
|
|
557
|
return [$retval, pos($string)]; |
158
|
|
|
|
|
|
|
} |
159
|
0
|
|
|
|
|
0
|
return; |
160
|
|
|
|
|
|
|
} ## end sub filename |
161
|
|
|
|
|
|
|
|
162
|
|
|
|
|
|
|
sub empty { |
163
|
252
|
|
|
252
|
0
|
525
|
my ($string, $pos) = @_; |
164
|
252
|
|
|
|
|
698
|
return [undef, $pos]; |
165
|
|
|
|
|
|
|
} |
166
|
|
|
|
|
|
|
|
167
|
|
|
|
|
|
|
sub is_empty { |
168
|
0
|
|
|
0
|
0
|
0
|
my ($struct) = @_; |
169
|
0
|
|
|
|
|
0
|
return @{$struct->[0]} > 0; |
|
0
|
|
|
|
|
0
|
|
170
|
|
|
|
|
|
|
} |
171
|
|
|
|
|
|
|
|
172
|
|
|
|
|
|
|
sub ws { |
173
|
0
|
|
|
0
|
0
|
0
|
my ($string, $pos) = @_; |
174
|
0
|
|
|
|
|
0
|
pos($string) = $pos; |
175
|
0
|
0
|
|
|
|
0
|
my ($retval) = $string =~ m{\G (\s+)}cgmxs |
176
|
|
|
|
|
|
|
or return; |
177
|
0
|
|
|
|
|
0
|
return [$retval, pos($string)]; |
178
|
|
|
|
|
|
|
} ## end sub ws |
179
|
|
|
|
|
|
|
|
180
|
|
|
|
|
|
|
sub optws { |
181
|
1520
|
|
|
1520
|
0
|
2536
|
my ($string, $pos) = @_; |
182
|
1520
|
|
|
|
|
3065
|
pos($string) = $pos; |
183
|
1520
|
|
|
|
|
6950
|
my ($retval) = $string =~ m{\G (\s*)}cgmxs; |
184
|
1520
|
|
100
|
|
|
5684
|
$retval = [$retval || '', pos($string)]; |
185
|
1520
|
|
|
|
|
3896
|
return $retval; |
186
|
|
|
|
|
|
|
} ## end sub optws |
187
|
|
|
|
|
|
|
|
188
|
|
|
|
|
|
|
sub _string { |
189
|
256
|
|
|
256
|
|
737
|
my ($target) = @_; |
190
|
256
|
|
|
|
|
428
|
my $len = length $target; |
191
|
|
|
|
|
|
|
return sub { |
192
|
128
|
|
|
128
|
|
251
|
my ($string, $pos) = @_; |
193
|
128
|
50
|
|
|
|
731
|
return unless substr($string, $pos, $len) eq $target; |
194
|
0
|
|
|
|
|
0
|
return [$target, $pos + $len]; |
195
|
|
|
|
|
|
|
} |
196
|
256
|
|
|
|
|
1204
|
} ## end sub _string |
197
|
|
|
|
|
|
|
|
198
|
|
|
|
|
|
|
sub _alternation { |
199
|
444
|
|
|
444
|
|
857
|
my @subs = _resolve(@_); |
200
|
|
|
|
|
|
|
return sub { |
201
|
444
|
|
|
444
|
|
743
|
my ($string, $pos) = @_; |
202
|
444
|
|
|
|
|
692
|
for my $sub (@subs) { |
203
|
824
|
|
100
|
|
|
1788
|
my $retval = $sub->($string, $pos) || next; |
204
|
444
|
|
|
|
|
1148
|
return $retval; |
205
|
|
|
|
|
|
|
} |
206
|
0
|
|
|
|
|
0
|
return; |
207
|
444
|
|
|
|
|
1829
|
}; |
208
|
|
|
|
|
|
|
} ## end sub _alternation |
209
|
|
|
|
|
|
|
|
210
|
|
|
|
|
|
|
sub _sequence { |
211
|
1140
|
|
|
1140
|
|
2002
|
my @subs = _resolve(@_); |
212
|
|
|
|
|
|
|
return sub { |
213
|
1140
|
|
|
1140
|
|
1936
|
my ($string, $pos) = @_; |
214
|
1140
|
|
|
|
|
1423
|
my @chunks; |
215
|
1140
|
|
|
|
|
1704
|
for my $sub (@subs) { |
216
|
3040
|
100
|
|
|
|
5810
|
my $chunk = $sub->($string, $pos) |
217
|
|
|
|
|
|
|
or return; |
218
|
2660
|
|
|
|
|
4538
|
push @chunks, $chunk; |
219
|
2660
|
|
|
|
|
4517
|
$pos = $chunk->[1]; |
220
|
|
|
|
|
|
|
} ## end for my $sub (@subs) |
221
|
760
|
|
|
|
|
2080
|
return [\@chunks, $pos]; |
222
|
1140
|
|
|
|
|
4829
|
}; |
223
|
|
|
|
|
|
|
} ## end sub _sequence |
224
|
|
|
|
|
|
|
|
225
|
|
|
|
|
|
|
sub _resolve { |
226
|
|
|
|
|
|
|
return |
227
|
1584
|
100
|
33
|
1584
|
|
2289
|
map { ref $_ ? $_ : __PACKAGE__->can($_) || LOGDIE "unknown $_" } @_; |
|
5700
|
|
|
|
|
18702
|
|
228
|
|
|
|
|
|
|
} |
229
|
|
|
|
|
|
|
|
230
|
|
|
|
|
|
|
1; |
231
|
|
|
|
|
|
|
|
232
|
|
|
|
|
|
|
__END__ |