line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package PPI::Token::_QuoteEngine; |
2
|
|
|
|
|
|
|
|
3
|
|
|
|
|
|
|
=pod |
4
|
|
|
|
|
|
|
|
5
|
|
|
|
|
|
|
=head1 NAME |
6
|
|
|
|
|
|
|
|
7
|
|
|
|
|
|
|
PPI::Token::_QuoteEngine - The PPI Quote Engine |
8
|
|
|
|
|
|
|
|
9
|
|
|
|
|
|
|
=head1 DESCRIPTION |
10
|
|
|
|
|
|
|
|
11
|
|
|
|
|
|
|
The C package is designed hold functionality |
12
|
|
|
|
|
|
|
for processing quotes and quote like operators, including regexes. |
13
|
|
|
|
|
|
|
These have special requirements in parsing. |
14
|
|
|
|
|
|
|
|
15
|
|
|
|
|
|
|
The C package itself provides various parsing |
16
|
|
|
|
|
|
|
methods, which the L, L and |
17
|
|
|
|
|
|
|
L can inherit from. In this sense, it serves |
18
|
|
|
|
|
|
|
as a base class. |
19
|
|
|
|
|
|
|
|
20
|
|
|
|
|
|
|
=head2 Using this class |
21
|
|
|
|
|
|
|
|
22
|
|
|
|
|
|
|
I<(Refers only to internal uses. This class does not provide a |
23
|
|
|
|
|
|
|
public interface)> |
24
|
|
|
|
|
|
|
|
25
|
|
|
|
|
|
|
To use these, you should initialize them as normal C<'$Class-Enew'>, |
26
|
|
|
|
|
|
|
and then call the 'fill' method, which will cause the specialised |
27
|
|
|
|
|
|
|
parser to scan forwards and parse the quote to its end point. |
28
|
|
|
|
|
|
|
|
29
|
|
|
|
|
|
|
If -Efill returns true, finalise the token. |
30
|
|
|
|
|
|
|
|
31
|
|
|
|
|
|
|
=cut |
32
|
|
|
|
|
|
|
|
33
|
65
|
|
|
65
|
|
383
|
use strict; |
|
65
|
|
|
|
|
114
|
|
|
65
|
|
|
|
|
1398
|
|
34
|
65
|
|
|
65
|
|
266
|
use Carp (); |
|
65
|
|
|
|
|
123
|
|
|
65
|
|
|
|
|
42952
|
|
35
|
|
|
|
|
|
|
|
36
|
|
|
|
|
|
|
our $VERSION = '1.276'; |
37
|
|
|
|
|
|
|
|
38
|
|
|
|
|
|
|
|
39
|
|
|
|
|
|
|
|
40
|
|
|
|
|
|
|
|
41
|
|
|
|
|
|
|
|
42
|
|
|
|
|
|
|
# Hook for the __TOKENIZER__on_char token call |
43
|
|
|
|
|
|
|
sub __TOKENIZER__on_char { |
44
|
15376
|
|
|
15376
|
|
21820
|
my $class = shift; |
45
|
15376
|
50
|
|
|
|
35210
|
my $t = $_[0]->{token} ? shift : return undef; |
46
|
|
|
|
|
|
|
|
47
|
|
|
|
|
|
|
# Call the fill method to process the quote |
48
|
15376
|
|
|
|
|
32385
|
my $rv = $t->{token}->_fill( $t ); |
49
|
15376
|
50
|
|
|
|
26946
|
return undef unless defined $rv; |
50
|
|
|
|
|
|
|
|
51
|
|
|
|
|
|
|
## Doesn't support "end of file" indicator |
52
|
|
|
|
|
|
|
|
53
|
|
|
|
|
|
|
# Finalize the token and return 0 to tell the tokenizer |
54
|
|
|
|
|
|
|
# to go to the next character. |
55
|
15376
|
|
|
|
|
35384
|
$t->_finalize_token; |
56
|
|
|
|
|
|
|
|
57
|
15376
|
|
|
|
|
35844
|
0; |
58
|
|
|
|
|
|
|
} |
59
|
|
|
|
|
|
|
|
60
|
|
|
|
|
|
|
|
61
|
|
|
|
|
|
|
|
62
|
|
|
|
|
|
|
|
63
|
|
|
|
|
|
|
|
64
|
|
|
|
|
|
|
##################################################################### |
65
|
|
|
|
|
|
|
# Optimised character processors, used for quotes |
66
|
|
|
|
|
|
|
# and quote like stuff, and accessible to the child classes |
67
|
|
|
|
|
|
|
|
68
|
|
|
|
|
|
|
# An outright scan, raw and fast. |
69
|
|
|
|
|
|
|
# Searches for a particular character, not escaped, loading in new |
70
|
|
|
|
|
|
|
# lines as needed. |
71
|
|
|
|
|
|
|
# When called, we start at the current position. |
72
|
|
|
|
|
|
|
# When leaving, the position should be set to the position |
73
|
|
|
|
|
|
|
# of the character, NOT the one after it. |
74
|
|
|
|
|
|
|
sub _scan_for_unescaped_character { |
75
|
14401
|
|
|
14401
|
|
17412
|
my $class = shift; |
76
|
14401
|
|
|
|
|
16539
|
my $t = shift; |
77
|
14401
|
50
|
|
|
|
28554
|
my $char = (length $_[0] == 1) ? quotemeta shift : return undef; |
78
|
|
|
|
|
|
|
|
79
|
|
|
|
|
|
|
# Create the search regex. |
80
|
|
|
|
|
|
|
# Same as above but with a negative look-behind assertion. |
81
|
14401
|
|
|
|
|
129544
|
my $search = qr/(.*?(?
|
82
|
|
|
|
|
|
|
|
83
|
14401
|
|
|
|
|
25839
|
my $string = ''; |
84
|
14401
|
|
|
|
|
27627
|
while ( exists $t->{line} ) { |
85
|
|
|
|
|
|
|
# Get the search area for the current line |
86
|
17128
|
|
|
|
|
34998
|
pos $t->{line} = $t->{line_cursor}; |
87
|
|
|
|
|
|
|
|
88
|
|
|
|
|
|
|
# Can we find a match on this line |
89
|
17128
|
100
|
|
|
|
170860
|
if ( $t->{line} =~ m/\G$search/gc ) { |
90
|
|
|
|
|
|
|
# Found the character on this line |
91
|
12707
|
|
|
|
|
31249
|
$t->{line_cursor} += length($1) - 1; |
92
|
12707
|
|
|
|
|
52371
|
return $string . $1; |
93
|
|
|
|
|
|
|
} |
94
|
|
|
|
|
|
|
|
95
|
|
|
|
|
|
|
# Load in the next line |
96
|
4421
|
|
|
|
|
10240
|
$string .= substr $t->{line}, $t->{line_cursor}; |
97
|
4421
|
|
|
|
|
8764
|
my $rv = $t->_fill_line('inscan'); |
98
|
4421
|
100
|
|
|
|
7398
|
if ( $rv ) { |
|
|
50
|
|
|
|
|
|
99
|
|
|
|
|
|
|
# Push to first character |
100
|
2727
|
|
|
|
|
5023
|
$t->{line_cursor} = 0; |
101
|
|
|
|
|
|
|
} elsif ( defined $rv ) { |
102
|
|
|
|
|
|
|
# We hit the End of File |
103
|
1694
|
|
|
|
|
5036
|
return \$string; |
104
|
|
|
|
|
|
|
} else { |
105
|
|
|
|
|
|
|
# Unexpected error |
106
|
0
|
|
|
|
|
0
|
return undef; |
107
|
|
|
|
|
|
|
} |
108
|
|
|
|
|
|
|
} |
109
|
|
|
|
|
|
|
|
110
|
|
|
|
|
|
|
# We shouldn't be able to get here |
111
|
0
|
|
|
|
|
0
|
return undef; |
112
|
|
|
|
|
|
|
} |
113
|
|
|
|
|
|
|
|
114
|
|
|
|
|
|
|
# Scan for a close braced, and take into account both escaping, |
115
|
|
|
|
|
|
|
# and open close bracket pairs in the string. When complete, the |
116
|
|
|
|
|
|
|
# method leaves the line cursor on the LAST character found. |
117
|
|
|
|
|
|
|
sub _scan_for_brace_character { |
118
|
1315
|
|
|
1315
|
|
1733
|
my $class = shift; |
119
|
1315
|
|
|
|
|
1700
|
my $t = shift; |
120
|
1315
|
50
|
|
|
|
4498
|
my $close_brace = $_[0] =~ /^(?:\>|\)|\}|\])$/ ? shift : Carp::confess(''); # return undef; |
121
|
1315
|
|
|
|
|
1840
|
my $open_brace = $close_brace; |
122
|
1315
|
|
|
|
|
2257
|
$open_brace =~ tr/\>\)\}\]/\<\(\{\[/; |
123
|
|
|
|
|
|
|
|
124
|
|
|
|
|
|
|
# Create the search string |
125
|
1315
|
|
|
|
|
2104
|
$close_brace = quotemeta $close_brace; |
126
|
1315
|
|
|
|
|
1677
|
$open_brace = quotemeta $open_brace; |
127
|
1315
|
|
|
|
|
12519
|
my $search = qr/\G(.*?(?
|
128
|
|
|
|
|
|
|
|
129
|
|
|
|
|
|
|
# Loop as long as we can get new lines |
130
|
1315
|
|
|
|
|
2422
|
my $string = ''; |
131
|
1315
|
|
|
|
|
1619
|
my $depth = 1; |
132
|
1315
|
|
|
|
|
3085
|
while ( exists $t->{line} ) { |
133
|
|
|
|
|
|
|
# Get the search area |
134
|
2459
|
|
|
|
|
4811
|
pos $t->{line} = $t->{line_cursor}; |
135
|
|
|
|
|
|
|
|
136
|
|
|
|
|
|
|
# Look for a match |
137
|
2459
|
100
|
|
|
|
14528
|
unless ( $t->{line} =~ /$search/gc ) { |
138
|
|
|
|
|
|
|
# Load in the next line |
139
|
700
|
|
|
|
|
1626
|
$string .= substr( $t->{line}, $t->{line_cursor} ); |
140
|
700
|
|
|
|
|
1405
|
my $rv = $t->_fill_line('inscan'); |
141
|
700
|
100
|
|
|
|
1287
|
if ( $rv ) { |
142
|
|
|
|
|
|
|
# Push to first character |
143
|
569
|
|
|
|
|
782
|
$t->{line_cursor} = 0; |
144
|
569
|
|
|
|
|
1003
|
next; |
145
|
|
|
|
|
|
|
} |
146
|
131
|
50
|
|
|
|
389
|
if ( defined $rv ) { |
147
|
|
|
|
|
|
|
# We hit the End of File |
148
|
131
|
|
|
|
|
435
|
return \$string; |
149
|
|
|
|
|
|
|
} |
150
|
|
|
|
|
|
|
|
151
|
|
|
|
|
|
|
# Unexpected error |
152
|
0
|
|
|
|
|
0
|
return undef; |
153
|
|
|
|
|
|
|
} |
154
|
|
|
|
|
|
|
|
155
|
|
|
|
|
|
|
# Add to the string |
156
|
1759
|
|
|
|
|
3902
|
$string .= $1; |
157
|
1759
|
|
|
|
|
2794
|
$t->{line_cursor} += length $1; |
158
|
|
|
|
|
|
|
|
159
|
|
|
|
|
|
|
# Alter the depth and continue if we aren't at the end |
160
|
1759
|
100
|
|
|
|
8195
|
$depth += ($1 =~ /$open_brace$/) ? 1 : -1 and next; |
|
|
100
|
|
|
|
|
|
161
|
|
|
|
|
|
|
|
162
|
|
|
|
|
|
|
# Rewind the cursor by one character ( cludgy hack ) |
163
|
1184
|
|
|
|
|
1918
|
$t->{line_cursor} -= 1; |
164
|
1184
|
|
|
|
|
4197
|
return $string; |
165
|
|
|
|
|
|
|
} |
166
|
|
|
|
|
|
|
|
167
|
|
|
|
|
|
|
# Returning the string as a reference indicates EOF |
168
|
0
|
|
|
|
|
0
|
\$string; |
169
|
|
|
|
|
|
|
} |
170
|
|
|
|
|
|
|
|
171
|
|
|
|
|
|
|
# Find all spaces and comments, up to, but not including |
172
|
|
|
|
|
|
|
# the first non-whitespace character. |
173
|
|
|
|
|
|
|
# |
174
|
|
|
|
|
|
|
# Although it doesn't return it, it leaves the cursor |
175
|
|
|
|
|
|
|
# on the character following the gap |
176
|
|
|
|
|
|
|
sub _scan_quote_like_operator_gap { |
177
|
665
|
|
|
665
|
|
925
|
my $t = $_[1]; |
178
|
|
|
|
|
|
|
|
179
|
665
|
|
|
|
|
921
|
my $string = ''; |
180
|
665
|
|
|
|
|
1320
|
while ( exists $t->{line} ) { |
181
|
|
|
|
|
|
|
# Get the search area for the current line |
182
|
735
|
|
|
|
|
1442
|
pos $t->{line} = $t->{line_cursor}; |
183
|
|
|
|
|
|
|
|
184
|
|
|
|
|
|
|
# Since this regex can match zero characters, it should always match |
185
|
735
|
50
|
|
|
|
2753
|
$t->{line} =~ /\G(\s*(?:\#.*)?)/gc or return undef; |
186
|
|
|
|
|
|
|
|
187
|
|
|
|
|
|
|
# Add the chars found to the string |
188
|
735
|
|
|
|
|
1530
|
$string .= $1; |
189
|
|
|
|
|
|
|
|
190
|
|
|
|
|
|
|
# Did we match the entire line? |
191
|
735
|
100
|
|
|
|
1865
|
unless ( $t->{line_cursor} + length $1 == length $t->{line} ) { |
192
|
|
|
|
|
|
|
# Partial line match, which means we are at |
193
|
|
|
|
|
|
|
# the end of the gap. Fix the cursor and return |
194
|
|
|
|
|
|
|
# the string. |
195
|
477
|
|
|
|
|
702
|
$t->{line_cursor} += length $1; |
196
|
477
|
|
|
|
|
1190
|
return $string; |
197
|
|
|
|
|
|
|
} |
198
|
|
|
|
|
|
|
|
199
|
|
|
|
|
|
|
# Load in the next line. |
200
|
|
|
|
|
|
|
# If we reach the EOF, $t->{line} gets deleted, |
201
|
|
|
|
|
|
|
# which is caught by the while. |
202
|
258
|
|
|
|
|
658
|
my $rv = $t->_fill_line('inscan'); |
203
|
258
|
100
|
|
|
|
771
|
if ( $rv ) { |
|
|
50
|
|
|
|
|
|
204
|
|
|
|
|
|
|
# Set the cursor to the first character |
205
|
70
|
|
|
|
|
152
|
$t->{line_cursor} = 0; |
206
|
|
|
|
|
|
|
} elsif ( defined $rv ) { |
207
|
|
|
|
|
|
|
# Returning the string as a reference indicates EOF |
208
|
188
|
|
|
|
|
432
|
return \$string; |
209
|
|
|
|
|
|
|
} else { |
210
|
0
|
|
|
|
|
|
return undef; |
211
|
|
|
|
|
|
|
} |
212
|
|
|
|
|
|
|
} |
213
|
|
|
|
|
|
|
|
214
|
|
|
|
|
|
|
# Shouldn't be able to get here |
215
|
0
|
|
|
|
|
|
return undef; |
216
|
|
|
|
|
|
|
} |
217
|
|
|
|
|
|
|
|
218
|
|
|
|
|
|
|
1; |
219
|
|
|
|
|
|
|
|
220
|
|
|
|
|
|
|
=pod |
221
|
|
|
|
|
|
|
|
222
|
|
|
|
|
|
|
=head1 SUPPORT |
223
|
|
|
|
|
|
|
|
224
|
|
|
|
|
|
|
See the L in the main module. |
225
|
|
|
|
|
|
|
|
226
|
|
|
|
|
|
|
=head1 AUTHOR |
227
|
|
|
|
|
|
|
|
228
|
|
|
|
|
|
|
Adam Kennedy Eadamk@cpan.orgE |
229
|
|
|
|
|
|
|
|
230
|
|
|
|
|
|
|
=head1 COPYRIGHT |
231
|
|
|
|
|
|
|
|
232
|
|
|
|
|
|
|
Copyright 2001 - 2011 Adam Kennedy. |
233
|
|
|
|
|
|
|
|
234
|
|
|
|
|
|
|
This program is free software; you can redistribute |
235
|
|
|
|
|
|
|
it and/or modify it under the same terms as Perl itself. |
236
|
|
|
|
|
|
|
|
237
|
|
|
|
|
|
|
The full text of the license can be found in the |
238
|
|
|
|
|
|
|
LICENSE file included with this module. |
239
|
|
|
|
|
|
|
|
240
|
|
|
|
|
|
|
=cut |