| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
# Copyright 2012 Jeffrey Kegler |
|
2
|
|
|
|
|
|
|
# This file is part of Marpa::PP. Marpa::PP is free software: you can |
|
3
|
|
|
|
|
|
|
# redistribute it and/or modify it under the terms of the GNU Lesser |
|
4
|
|
|
|
|
|
|
# General Public License as published by the Free Software Foundation, |
|
5
|
|
|
|
|
|
|
# either version 3 of the License, or (at your option) any later version. |
|
6
|
|
|
|
|
|
|
# |
|
7
|
|
|
|
|
|
|
# Marpa::PP is distributed in the hope that it will be useful, |
|
8
|
|
|
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
9
|
|
|
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
|
10
|
|
|
|
|
|
|
# Lesser General Public License for more details. |
|
11
|
|
|
|
|
|
|
# |
|
12
|
|
|
|
|
|
|
# You should have received a copy of the GNU Lesser |
|
13
|
|
|
|
|
|
|
# General Public License along with Marpa::PP. If not, see |
|
14
|
|
|
|
|
|
|
# http://www.gnu.org/licenses/. |
|
15
|
|
|
|
|
|
|
|
|
16
|
|
|
|
|
|
|
package Marpa::PP::Recognizer; |
|
17
|
|
|
|
|
|
|
|
|
18
|
44
|
|
|
44
|
|
1555
|
use 5.010; |
|
|
44
|
|
|
|
|
162
|
|
|
|
44
|
|
|
|
|
2059
|
|
|
19
|
44
|
|
|
44
|
|
1177
|
use warnings; |
|
|
44
|
|
|
|
|
269
|
|
|
|
44
|
|
|
|
|
6298
|
|
|
20
|
|
|
|
|
|
|
|
|
21
|
|
|
|
|
|
|
no warnings ## no critic (TestingAndDebugging::ProhibitNoWarnings) |
|
22
|
44
|
|
|
44
|
|
459
|
'recursion'; |
|
|
44
|
|
|
|
|
97
|
|
|
|
44
|
|
|
|
|
2707
|
|
|
23
|
|
|
|
|
|
|
|
|
24
|
44
|
|
|
44
|
|
1054
|
use strict; |
|
|
44
|
|
|
|
|
108
|
|
|
|
44
|
|
|
|
|
8757
|
|
|
25
|
44
|
|
|
44
|
|
2981
|
use integer; |
|
|
44
|
|
|
|
|
103
|
|
|
|
44
|
|
|
|
|
390
|
|
|
26
|
|
|
|
|
|
|
|
|
27
|
44
|
|
|
44
|
|
1777
|
use English qw( -no_match_vars ); |
|
|
44
|
|
|
|
|
2049
|
|
|
|
44
|
|
|
|
|
451
|
|
|
28
|
|
|
|
|
|
|
|
|
29
|
44
|
|
|
44
|
|
33060
|
use vars qw($VERSION $STRING_VERSION); |
|
|
44
|
|
|
|
|
140
|
|
|
|
44
|
|
|
|
|
6107
|
|
|
30
|
|
|
|
|
|
|
$VERSION = '0.014000'; |
|
31
|
|
|
|
|
|
|
$STRING_VERSION = $VERSION; |
|
32
|
|
|
|
|
|
|
{ |
|
33
|
|
|
|
|
|
|
## no critic (BuiltinFunctions::ProhibitStringyEval) |
|
34
|
|
|
|
|
|
|
## no critic (ValuesAndExpressions::RequireConstantVersion) |
|
35
|
|
|
|
|
|
|
$VERSION = eval $VERSION; |
|
36
|
|
|
|
|
|
|
} |
|
37
|
|
|
|
|
|
|
|
|
38
|
|
|
|
|
|
|
# Field list for Earley sets, handed to Marpa::PP::offset() at compile
# time.  The names listed under the ":package=" line are used elsewhere
# in this file as array indexes, for example
# Marpa::PP::Internal::Earley_Set::ORDINAL.  The text in braces after a
# name appears to be descriptive commentary only -- confirm against
# Marpa::PP::offset().
BEGIN {
    my $field_spec = <<'END_OF_STRUCTURE';

    :package=Marpa::PP::Internal::Earley_Set

    ORDINAL { The ordinal for this set }
    ITEMS { The Earley items for this set. }
    HASH { Hash by origin & state. To prevent dups. }
    POSTDOT { Index by postdot symbol. }

END_OF_STRUCTURE
    Marpa::PP::offset($field_spec);
} ## end BEGIN
|
51
|
|
|
|
|
|
|
|
|
52
|
|
|
|
|
|
|
# Elements of the EARLEY ITEM structure |
|
53
|
|
|
|
|
|
|
# Note that these are Earley items as modified by Aycock & Horspool, |
|
54
|
|
|
|
|
|
|
# with AHFA states instead of |
|
55
|
|
|
|
|
|
|
# LR(0) items. |
|
56
|
|
|
|
|
|
|
|
|
57
|
|
|
|
|
|
|
# We don't prune the Earley items because we want ORIGIN and SET |
|
58
|
|
|
|
|
|
|
# around for debugging. |
|
59
|
|
|
|
|
|
|
|
|
60
|
|
|
|
|
|
|
# Field list for Earley items, handed to Marpa::PP::offset() at compile
# time.  The names are used elsewhere in this file as array indexes
# under the Marpa::PP::Internal::Earley_Item:: prefix.
BEGIN {
    my $field_spec = <<'END_OF_STRUCTURE';

    :package=Marpa::PP::Internal::Earley_Item

    ID { ID of Earley item. Unique within recognizer. }
    STATE { The AHFA state. }
    LINKS { A list of the links from the completer step. }

    LEO_LINKS { Leo Links sources -- not necessarily unique.
    No more than one Leo link can come from a single
    Earleme.
    But the distance to the origin of this item can be
    "factored" differently between predecessor and cause.
    Each different "factoring" can contribute a Leo
    link. }
    IS_LEO_EXPANDED { Flag indicating if Leo links were expanded }

    ORIGIN { The number of the Earley set with the parent item(s) }
    SET { The set this item is in. For debugging. }

END_OF_STRUCTURE
    Marpa::PP::offset($field_spec);
} ## end BEGIN
|
84
|
|
|
|
|
|
|
|
|
85
|
|
|
|
|
|
|
# Name of the package that holds the Leo item field offsets.
our $LEO_CLASS = 'Marpa::PP::Internal::Leo_Item';
|
87
|
|
|
|
|
|
|
|
|
88
|
|
|
|
|
|
|
# Field list for Leo items, handed to Marpa::PP::offset() at compile
# time under the Marpa::PP::Internal::Leo_Item:: prefix.
BEGIN {
    my $field_spec = <<'END_OF_STRUCTURE';

    :package=Marpa::PP::Internal::Leo_Item

    LEO_POSTDOT_SYMBOL { A symbol name. }
    ORIGIN { The number of the Earley set with the parent item(s) }
    BASE { The Earley item on which this item is based. }
    PREDECESSOR { The Leo item prior in the series to this one. }
    SET { The set this item is in. }
    TOP_TO_STATE { The AHFA to-state of the top-level transition. }

END_OF_STRUCTURE
    Marpa::PP::offset($field_spec);
} ## end BEGIN
|
103
|
|
|
|
|
|
|
|
|
104
|
|
|
|
|
|
|
# Elements of the RECOGNIZER structure |
|
105
|
|
|
|
|
|
|
# Field list for the recognizer object itself, handed to
# Marpa::PP::offset() at compile time.  The recognizer is a blessed
# array, and the names below are used throughout this file as its
# indexes under the Marpa::PP::Internal::Recognizer:: prefix.
BEGIN {
    my $field_spec = <<'END_OF_STRUCTURE';

    :package=Marpa::PP::Internal::Recognizer

    C { A C structure }

    GRAMMAR { the grammar used }
    EARLEY_SETS { the array of the Earley sets }
    NEXT_EARLEY_ITEM_ID { ID of the next Earley item to be created. }
    FURTHEST_EARLEME { last earley set with something in it }
    LAST_COMPLETED_EARLEME { the current earleme }
    FINISHED
    EXHAUSTED { can parse continue? }
    EXPECTED_TERMINALS { terminals which are expected at the
    current earleme }
    USE_LEO { Use Leo items? }
    NEXT_ORDINAL { Ordinal of next Earley set }
    EARLEY_SETS_BY_ORDINAL { Array of Earley sets by ordinal }

    TRACE_FILE_HANDLE

    END
    CLOSURES
    TRACE_ACTIONS
    TRACE_VALUES
    TRACE_TASKS
    TRACING
    MAX_PARSES
    NULL_VALUES
    RANKING_METHOD

    { The following fields must be reinitialized when
    evaluation is reset }

    SINGLE_PARSE_MODE
    PARSE_COUNT :{ number of parses in an ambiguous parse :}

    AND_NODES
    AND_NODE_HASH
    OR_NODES
    OR_NODE_HASH

    ITERATION_STACK

    EVALUATOR_RULES

    { This is the end of the list of fields which
    must be reinitialized when evaluation is reset }

    TOO_MANY_EARLEY_ITEMS
    TRACE_EARLEY_SETS
    TRACE_TERMINALS
    WARNINGS

    MODE

END_OF_STRUCTURE
    Marpa::PP::offset($field_spec);
} ## end BEGIN
|
165
|
|
|
|
|
|
|
|
|
166
|
|
|
|
|
|
|
package Marpa::PP::Internal::Recognizer; |
|
167
|
|
|
|
|
|
|
|
|
168
|
44
|
|
|
44
|
|
475
|
use English qw( -no_match_vars ); |
|
|
44
|
|
|
|
|
4242
|
|
|
|
44
|
|
|
|
|
413
|
|
|
169
|
|
|
|
|
|
|
|
|
170
|
44
|
|
|
44
|
|
33645
|
# Package-level constants.
#   EARLEME_MASK                  - complement of 0x7fffffff, i.e. every
#                                   bit above the low 31 is set.
#   DEFAULT_TOO_MANY_EARLEY_ITEMS - floor used by new() when no
#                                   too_many_earley_items option is given.
use constant {
    EARLEME_MASK                  => ~(0x7fffffff),
    DEFAULT_TOO_MANY_EARLEY_ITEMS => 100,
};

# File-scoped counter, initialised to zero.
my $parse_number = 0;
|
175
|
|
|
|
|
|
|
|
|
176
|
|
|
|
|
|
|
# Construct a recognizer for a grammar.
#
# Arguments: the class name, followed by zero or more references to
# hashes of named arguments.  The first hash holding a defined "grammar"
# entry supplies the grammar; that entry is deleted from the caller's
# hash, and all the hashes are then passed to set().
#
# Returns the new recognizer object.  Throws an exception when no grammar
# is given, when the grammar is not a Marpa::PP::Grammar, has recorded
# problems, or is not in the PRECOMPUTED phase, and when the grammar
# cycles while a ranking method other than 'none' is in effect and no
# cycle ranking action is defined.
sub Marpa::PP::Recognizer::new {
    my ( $class, @arg_hashes ) = @_;
    my $recce = bless [], 'Marpa::PP::Recognizer';

    my $grammar;
    ARG_HASH: for my $arg_hash (@arg_hashes) {
        if ( defined( $grammar = $arg_hash->{grammar} ) ) {

            # Removed so that set() does not reject it as an unknown option
            delete $arg_hash->{grammar};
            last ARG_HASH;
        }
    } ## end for my $arg_hash (@arg_hashes)
    Marpa::PP::exception('No grammar specified') if not defined $grammar;

    $recce->[Marpa::PP::Internal::Recognizer::GRAMMAR] = $grammar;

    my $grammar_class = ref $grammar;
    Marpa::PP::exception(
        "${class}::new() grammar arg has wrong class: $grammar_class")
        if not $grammar_class eq 'Marpa::PP::Grammar';

    my $problems = $grammar->[Marpa::PP::Internal::Grammar::PROBLEMS];
    if ($problems) {
        Marpa::PP::exception(
            Marpa::PP::Grammar::show_problems($grammar),
            "Attempt to parse grammar with fatal problems\n",
            'Marpa::PP cannot proceed',
        );
    } ## end if ($problems)

    my $phase = $grammar->[Marpa::PP::Internal::Grammar::PHASE];
    if ( $phase != Marpa::PP::Internal::Phase::PRECOMPUTED ) {
        Marpa::PP::exception(
            'Attempt to parse grammar in inappropriate phase ',
            Marpa::PP::Internal::Phase::description($phase)
        );
    } ## end if ( $phase != Marpa::PP::Internal::Phase::PRECOMPUTED)

    # set the defaults
    # NOTE(review): the localized trace handle is taken from the grammar
    # before set() runs, so a trace_fh or trace_file_handle argument does
    # not redirect the "Expecting" messages printed at the end of this
    # sub -- confirm that this is intended.
    local $Marpa::PP::Internal::TRACE_FH =
        $recce->[Marpa::PP::Internal::Recognizer::TRACE_FILE_HANDLE] =
        $grammar->[Marpa::PP::Internal::Grammar::TRACE_FILE_HANDLE];
    $recce->[Marpa::PP::Internal::Recognizer::WARNINGS]            = 1;
    $recce->[Marpa::PP::Internal::Recognizer::MODE]                = 'default';
    $recce->[Marpa::PP::Internal::Recognizer::RANKING_METHOD]      = 'none';
    $recce->[Marpa::PP::Internal::Recognizer::USE_LEO]             = 1;
    $recce->[Marpa::PP::Internal::Recognizer::MAX_PARSES]          = 0;
    $recce->[Marpa::PP::Internal::Recognizer::NEXT_EARLEY_ITEM_ID] = 0;
    $recce->reset_evaluation();

    $recce->set(@arg_hashes);

    if (    $grammar->[Marpa::PP::Internal::Grammar::HAS_CYCLE]
        and $recce->[Marpa::PP::Internal::Recognizer::RANKING_METHOD] ne
        'none'
        and not $grammar->[Marpa::PP::Internal::Grammar::CYCLE_RANKING_ACTION]
        )
    {
        Marpa::PP::exception(
            "The grammar cycles (is infinitely ambiguous)\n",
            " but it has no 'cycle_ranking_action'.\n",
            " Either rewrite the grammar to eliminate cycles\n",
            " or define a 'cycle ranking action'\n"
        );
    } ## end if ( $grammar->[Marpa::PP::Internal::Grammar::HAS_CYCLE...])

    my $trace_terminals =
        $recce->[Marpa::PP::Internal::Recognizer::TRACE_TERMINALS] // 0;

    # Unless the caller chose a threshold, use twice the number of AHFA
    # states, but never less than the package default.
    if (not defined
        $recce->[Marpa::PP::Internal::Recognizer::TOO_MANY_EARLEY_ITEMS] )
    {
        my $AHFA_size =
            scalar @{ $grammar->[Marpa::PP::Internal::Grammar::AHFA] };
        $recce->[Marpa::PP::Internal::Recognizer::TOO_MANY_EARLEY_ITEMS] =
            List::Util::max( ( 2 * $AHFA_size ),
            Marpa::PP::Internal::Recognizer::DEFAULT_TOO_MANY_EARLEY_ITEMS );
    } ## end if ( not defined $recce->[...])

    # Some of this processing -- to find terminals and Leo symbols
    # by state -- should perhaps be done in the grammar.

    my $terminal_names =
        $grammar->[Marpa::PP::Internal::Grammar::TERMINAL_NAMES];
    my $start_states = $grammar->[Marpa::PP::Internal::Grammar::START_STATES];

    # Build Earley set 0: one item per start state, indexed in %postdot
    # by every symbol on which that state has a transition.
    my @earley_items = ();
    my %postdot      = ();

    for my $state ( @{$start_states} ) {
        my $item = [];
        $item->[Marpa::PP::Internal::Earley_Item::ID] =
            $recce->[Marpa::PP::Internal::Recognizer::NEXT_EARLEY_ITEM_ID]++;
        $item->[Marpa::PP::Internal::Earley_Item::STATE]  = $state;
        $item->[Marpa::PP::Internal::Earley_Item::ORIGIN] = 0;
        $item->[Marpa::PP::Internal::Earley_Item::LINKS]  = [];
        $item->[Marpa::PP::Internal::Earley_Item::SET]    = 0;

        push @earley_items, $item;

        # Only the transition symbols are needed here, so iterate over
        # the keys rather than using each()
        for my $transition_symbol (
            keys %{ $state->[Marpa::PP::Internal::AHFA::TRANSITION] } )
        {
            push @{ $postdot{$transition_symbol} }, $item;
        }

    } ## end for my $state ( @{$start_states} )

    my $earley_set = [];
    $earley_set->[Marpa::PP::Internal::Earley_Set::POSTDOT] = \%postdot;
    $earley_set->[Marpa::PP::Internal::Earley_Set::ITEMS]   = \@earley_items;
    $earley_set->[Marpa::PP::Internal::Earley_Set::ORDINAL] = 0;
    $recce->[Marpa::PP::Internal::Recognizer::EARLEY_SETS]  = [$earley_set];

    $recce->[Marpa::PP::Internal::Recognizer::FURTHEST_EARLEME]       = 0;
    $recce->[Marpa::PP::Internal::Recognizer::LAST_COMPLETED_EARLEME] = 0;
    $recce->[Marpa::PP::Internal::Recognizer::NEXT_ORDINAL]           = 1;
    $recce->[Marpa::PP::Internal::Recognizer::EARLEY_SETS_BY_ORDINAL]->[0] =
        $earley_set;

    my @terminals_expected = grep { $terminal_names->{$_} } keys %postdot;
    $recce->[Marpa::PP::Internal::Recognizer::EXPECTED_TERMINALS] =
        \@terminals_expected;

    # With no terminal expected at earleme 0 the parse is already exhausted
    $recce->[Marpa::PP::Internal::Recognizer::EXHAUSTED] =
        scalar @terminals_expected <= 0;

    if ( $trace_terminals > 1 ) {
        for my $terminal ( sort @terminals_expected ) {
            say {$Marpa::PP::Internal::TRACE_FH}
                qq{Expecting "$terminal" at earleme 0}
                or Marpa::PP::exception("Cannot print: $ERRNO");
        }
    } ## end if ( $trace_terminals > 1 )

    return $recce;
} ## end sub Marpa::PP::Recognizer::new
|
326
|
|
|
|
|
|
|
|
|
327
|
44
|
|
|
|
|
3353
|
# Lists used by set() for validation:
#   RECOGNIZER_OPTIONS - every named argument the recognizer accepts
#   RECOGNIZER_MODES   - the values allowed for the "mode" argument
use constant {
    RECOGNIZER_OPTIONS => [
        'closures',          'end',
        'leo',               'max_parses',
        'mode',              'ranking_method',
        'too_many_earley_items',
        'trace_actions',     'trace_earley_sets',
        'trace_fh',          'trace_file_handle',
        'trace_tasks',       'trace_terminals',
        'trace_values',      'warnings',
    ],
    RECOGNIZER_MODES => [ 'default', 'stream' ],
};
|
|
44
|
|
|
|
|
183
|
|
|
|
44
|
|
|
|
|
253134
|
|
|
348
|
|
|
|
|
|
|
|
|
349
|
|
|
|
|
|
|
# Put the evaluation-related fields of the recognizer back into their
# initial state: a parse count of zero, an undefined single-parse-mode
# flag, and fresh empty containers for the and-node and or-node tables,
# the iteration stack and the evaluator rules.  Returns nothing.
sub Marpa::PP::Recognizer::reset_evaluation {
    my ($self) = @_;

    $self->[Marpa::PP::Internal::Recognizer::PARSE_COUNT]       = 0;
    $self->[Marpa::PP::Internal::Recognizer::SINGLE_PARSE_MODE] = undef;

    # Fields that restart as empty arrays
    for my $array_field (
        Marpa::PP::Internal::Recognizer::AND_NODES(),
        Marpa::PP::Internal::Recognizer::OR_NODES(),
        Marpa::PP::Internal::Recognizer::ITERATION_STACK(),
        Marpa::PP::Internal::Recognizer::EVALUATOR_RULES(),
        )
    {
        $self->[$array_field] = [];
    }

    # Fields that restart as empty hashes
    for my $hash_field (
        Marpa::PP::Internal::Recognizer::AND_NODE_HASH(),
        Marpa::PP::Internal::Recognizer::OR_NODE_HASH(),
        )
    {
        $self->[$hash_field] = {};
    }

    return;
} ## end sub Marpa::PP::Recognizer::reset_evaluation
|
361
|
|
|
|
|
|
|
|
|
362
|
|
|
|
|
|
|
# Apply named arguments to a recognizer.
#
# Arguments: the recognizer, followed by zero or more references to
# hashes of options.  Each hash is validated and then applied in turn.
# Option names must appear in RECOGNIZER_OPTIONS; an option whose value
# is undefined is ignored.
#
# Returns 1.  Croaks when an argument is not a hash reference, when an
# option name is unknown or when the mode is unknown.  Throws a
# Marpa::PP exception for a bad ranking_method, trace_tasks or closure
# value, for "end" or "closures" once the parse count is above zero,
# and when a trace message cannot be printed.
sub Marpa::PP::Recognizer::set {
    my ( $recce, @arg_hashes ) = @_;

    # This may get changed below
    my $trace_fh =
        $recce->[Marpa::PP::Internal::Recognizer::TRACE_FILE_HANDLE];

    # Lookup tables for the validity checks.  Plain hash lookups are used
    # in place of the deprecated smartmatch operator.
    my %is_option = map { ( $_ => 1 ) }
        @{ Marpa::PP::Internal::Recognizer::RECOGNIZER_OPTIONS() };
    my %is_mode = map { ( $_ => 1 ) }
        @{ Marpa::PP::Internal::Recognizer::RECOGNIZER_MODES() };

    for my $args (@arg_hashes) {

        my $ref_type = ref $args;
        if ( not $ref_type or $ref_type ne 'HASH' ) {
            Carp::croak(
                'Marpa::PP Recognizer expects args as ref to HASH, got ',
                ( $ref_type ? "ref to $ref_type" : 'non-reference' ),
                ' instead'
            );
        } ## end if ( not $ref_type or $ref_type ne 'HASH' )
        if ( my @bad_options = grep { not $is_option{$_} } keys %{$args} ) {
            Carp::croak( 'Unknown option(s) for Marpa::PP Recognizer: ',
                join q{ }, @bad_options );
        }

        if ( defined( my $value = $args->{'leo'} ) ) {

            # Normalized to a strict 1 or 0
            $recce->[Marpa::PP::Internal::Recognizer::USE_LEO] =
                $value ? 1 : 0;
        }

        if ( defined( my $value = $args->{'max_parses'} ) ) {
            $recce->[Marpa::PP::Internal::Recognizer::MAX_PARSES] = $value;
        }

        if ( defined( my $value = $args->{'mode'} ) ) {
            if ( not $is_mode{$value} ) {
                Carp::croak( 'Unknown mode for Marpa::PP Recognizer: ',
                    $value );
            }
            $recce->[Marpa::PP::Internal::Recognizer::MODE] = $value;
        } ## end if ( defined( my $value = $args->{'mode'} ) )

        if ( defined( my $value = $args->{'ranking_method'} ) ) {
            Marpa::PP::exception(q{ranking_method no longer implemented})
                if not $Marpa::PP::AUTHOR_TEST_ONLY;
            Marpa::PP::exception(
                q{ranking_method must be 'constant' or 'none'})
                if not grep { $value eq $_ } qw(constant none);
            $recce->[Marpa::PP::Internal::Recognizer::RANKING_METHOD] =
                $value;
        } ## end if ( defined( my $value = $args->{'ranking_method'} ...))

        # "trace_fh" and "trace_file_handle" set the same field.  When
        # both are given, "trace_file_handle" is applied last and wins.
        if ( defined( my $value = $args->{'trace_fh'} ) ) {
            $trace_fh =
                $recce->[Marpa::PP::Internal::Recognizer::TRACE_FILE_HANDLE] =
                $value;
        }

        if ( defined( my $value = $args->{'trace_file_handle'} ) ) {
            $trace_fh =
                $recce->[Marpa::PP::Internal::Recognizer::TRACE_FILE_HANDLE] =
                $value;
        }

        if ( defined( my $value = $args->{'trace_actions'} ) ) {
            $recce->[Marpa::PP::Internal::Recognizer::TRACE_ACTIONS] = $value;
            ## Do not allow setting this option in recognizer for single parse mode
            $recce->[Marpa::PP::Internal::Recognizer::SINGLE_PARSE_MODE] = 0;
            if ($value) {
                say {$trace_fh} 'Setting trace_actions option'
                    or Marpa::PP::exception("Cannot print: $ERRNO");
                $recce->[Marpa::PP::Internal::Recognizer::TRACING] = 1;
            }
        } ## end if ( defined( my $value = $args->{'trace_actions'} ))

        if ( defined( my $value = $args->{'trace_tasks'} ) ) {
            Marpa::PP::exception('trace_tasks must be set to a number >= 0')
                if $value !~ /\A\d+\z/xms;
            $recce->[Marpa::PP::Internal::Recognizer::TRACE_TASKS] =
                $value + 0;
            if ($value) {
                say {$trace_fh} "Setting trace_tasks option to $value"
                    or Marpa::PP::exception("Cannot print: $ERRNO");
                $recce->[Marpa::PP::Internal::Recognizer::TRACING] = 1;
            }
        } ## end if ( defined( my $value = $args->{'trace_tasks'} ) )

        if ( defined( my $value = $args->{'trace_terminals'} ) ) {
            $recce->[Marpa::PP::Internal::Recognizer::TRACE_TERMINALS] =
                $value;
            if ($value) {
                say {$trace_fh} 'Setting trace_terminals option'
                    or Marpa::PP::exception("Cannot print: $ERRNO");
                $recce->[Marpa::PP::Internal::Recognizer::TRACING] = 1;
            }
        } ## end if ( defined( my $value = $args->{'trace_terminals'}...))

        if ( defined( my $value = $args->{'trace_earley_sets'} ) ) {
            $recce->[Marpa::PP::Internal::Recognizer::TRACE_EARLEY_SETS] =
                $value;
            if ($value) {
                say {$trace_fh} 'Setting trace_earley_sets option'
                    or Marpa::PP::exception("Cannot print: $ERRNO");
                $recce->[Marpa::PP::Internal::Recognizer::TRACING] = 1;
            }
        } ## end if ( defined( my $value = $args->{'trace_earley_sets'...}))

        if ( defined( my $value = $args->{'trace_values'} ) ) {
            $recce->[Marpa::PP::Internal::Recognizer::TRACE_VALUES] = $value;
            ## Do not allow setting this option in recognizer for single parse mode
            $recce->[Marpa::PP::Internal::Recognizer::SINGLE_PARSE_MODE] = 0;
            if ($value) {
                say {$trace_fh} 'Setting trace_values option'
                    or Marpa::PP::exception("Cannot print: $ERRNO");
                $recce->[Marpa::PP::Internal::Recognizer::TRACING] = 1;
            }
        } ## end if ( defined( my $value = $args->{'trace_values'} ) )

        if ( defined( my $value = $args->{'end'} ) ) {

            # Not allowed once parsing is started
            if ( $recce->[Marpa::PP::Internal::Recognizer::PARSE_COUNT] > 0 )
            {
                Marpa::PP::exception(
                    q{Cannot reset end once parsing has started});
            }
            $recce->[Marpa::PP::Internal::Recognizer::END] = $value;
            ## Do not allow setting this option in recognizer for single parse mode
            $recce->[Marpa::PP::Internal::Recognizer::SINGLE_PARSE_MODE] = 0;
        } ## end if ( defined( my $value = $args->{'end'} ) )

        if ( defined( my $value = $args->{'closures'} ) ) {

            # Not allowed once parsing is started
            if ( $recce->[Marpa::PP::Internal::Recognizer::PARSE_COUNT] > 0 )
            {
                Marpa::PP::exception(
                    q{Cannot reset closures once parsing has started});
            }
            my $closures =
                $recce->[Marpa::PP::Internal::Recognizer::CLOSURES] = $value;
            ## Do not allow setting this option in recognizer for single parse mode
            $recce->[Marpa::PP::Internal::Recognizer::SINGLE_PARSE_MODE] = 0;

            # keys() is used instead of each() so that an exception here
            # does not leave the caller's hash iterator half-advanced
            for my $action ( keys %{$closures} ) {
                Marpa::PP::exception(qq{Bad closure for action "$action"})
                    if ref $closures->{$action} ne 'CODE';
            }
        } ## end if ( defined( my $value = $args->{'closures'} ) )

        if ( defined( my $value = $args->{'warnings'} ) ) {
            $recce->[Marpa::PP::Internal::Recognizer::WARNINGS] = $value;
        }

        if ( defined( my $value = $args->{'too_many_earley_items'} ) ) {
            $recce->[Marpa::PP::Internal::Recognizer::TOO_MANY_EARLEY_ITEMS] =
                $value;
        }

    } ## end for my $args (@arg_hashes)

    return 1;
} ## end sub Marpa::PP::Recognizer::set
|
529
|
|
|
|
|
|
|
|
|
530
|
|
|
|
|
|
|
# Not intended to be documented.
# Given the ordinal of an Earley set, returns the number of Earley items
# in that set, or nothing at all when there is no set with that ordinal.
# For testing, especially that the Leo items
# are doing their job.
sub Marpa::PP::Recognizer::earley_set_size {
    my ( $self, $set_ordinal ) = @_;

    my $set =
        $self->[Marpa::PP::Internal::Recognizer::EARLEY_SETS_BY_ORDINAL]
        ->[$set_ordinal];
    defined $set or return;

    my $item_count = @{ $set->[Marpa::PP::Internal::Earley_Set::ITEMS] };
    return $item_count;
} ## end sub Marpa::PP::Recognizer::earley_set_size
|
542
|
|
|
|
|
|
|
|
|
543
|
|
|
|
|
|
|
# Returns the ordinal of the latest Earley set: starting at the last
# completed earleme and stepping backwards one earleme at a time, the
# first set found with a defined ORDINAL supplies the result.
sub Marpa::PP::Recognizer::latest_earley_set {
    my ($self) = @_;

    # Earley set has a defined ORDINAL, so this loop must terminate
    EARLEME:
    for (
        my $earleme =
        $self->[Marpa::PP::Internal::Recognizer::LAST_COMPLETED_EARLEME];
        ;
        $earleme--
        )
    {
        # The set is fetched into a lexical first, so that an earleme
        # without a set is not autovivified inside the recognizer
        my $candidate_set =
            $self->[Marpa::PP::Internal::Recognizer::EARLEY_SETS]
            ->[$earleme];
        my $set_ordinal =
            $candidate_set->[Marpa::PP::Internal::Earley_Set::ORDINAL];
        next EARLEME if not defined $set_ordinal;
        return $set_ordinal;
    } ## end for ( my $earleme = ...)
    die 'Internal error: this line should not be reached';
} ## end sub Marpa::PP::Recognizer::latest_earley_set
|
559
|
|
|
|
|
|
|
|
|
560
|
|
|
|
|
|
|
# Convenience wrapper: asks the recognizer's grammar object
# to check_terminal() the named symbol and passes its answer
# straight back to the caller.
sub Marpa::PP::Recognizer::check_terminal {
    my ( $recce, $name ) = @_;
    return $recce->[Marpa::PP::Internal::Recognizer::GRAMMAR]
        ->check_terminal($name);
}
|
565
|
|
|
|
|
|
|
|
|
566
|
|
|
|
|
|
|
# Accessor: returns the recognizer's EXHAUSTED slot, unchanged.
sub Marpa::PP::Recognizer::exhausted {
    my ($recce) = @_;
    return $recce->[Marpa::PP::Internal::Recognizer::EXHAUSTED];
}
|
569
|
|
|
|
|
|
|
|
|
570
|
|
|
|
|
|
|
# Accessor: the "current earleme" reported to callers is the
# recognizer's LAST_COMPLETED_EARLEME slot, returned unchanged.
sub Marpa::PP::Recognizer::current_earleme {
    my ($recce) = @_;
    return $recce->[Marpa::PP::Internal::Recognizer::LAST_COMPLETED_EARLEME];
}
|
573
|
|
|
|
|
|
|
|
|
574
|
|
|
|
|
|
|
# Accessor: returns the recognizer's EXPECTED_TERMINALS slot, unchanged.
sub Marpa::PP::Recognizer::terminals_expected {
    my ($recce) = @_;
    return $recce->[Marpa::PP::Internal::Recognizer::EXPECTED_TERMINALS];
}
|
577
|
|
|
|
|
|
|
|
|
578
|
|
|
|
|
|
|
# Deprecated -- obsolete
# Context-sensitive summary of the recognizer:
#   list context -- ( current earleme, expected terminals )
#   otherwise    -- the current earleme only
sub Marpa::PP::Recognizer::status {
    my $recce = $_[0];
    if ( not wantarray ) {
        return $recce->current_earleme();
    }
    return ( $recce->current_earleme(), $recce->terminals_expected() );
} ## end sub Marpa::PP::Recognizer::status
|
586
|
|
|
|
|
|
|
|
|
587
|
|
|
|
|
|
|
# Now useless and deprecated
# Does nothing to the recognizer; always returns a true value.
sub Marpa::PP::Recognizer::strip {
    return 1;
}
|
589
|
|
|
|
|
|
|
|
|
590
|
|
|
|
|
|
|
# Viewing methods, for debugging |
|
591
|
|
|
|
|
|
|
|
|
592
|
|
|
|
|
|
|
# Describes one link of an Earley item as "[field; field; ...]".
# A link is an array: ( predecessor, cause, token name, value ref ).
#   p=<name>  the predecessor item, when there is one
#   c=<name>  the cause item, when the cause is defined
#   s=<name>  the token name, when the cause is not defined
#   t=<dump>  Data::Dumper (terse) dump of the value reference,
#             also only when the cause is not defined
sub Marpa::PP::show_link_choice {
    my ($link) = @_;
    my ( $predecessor, $cause, $token_name, $value_ref ) = @{$link};

    my @fields;
    push @fields, 'p=' . Marpa::PP::Internal::Earley_Item::name($predecessor)
        if $predecessor;

    if ( defined $cause ) {
        push @fields, 'c=' . Marpa::PP::Internal::Earley_Item::name($cause);
    }
    else {
        my $dumper = Data::Dumper->new( [$value_ref] );
        $dumper->Terse(1);
        my $dumped_value = $dumper->Dump;

        # Dump ends its output with a newline, which has no
        # place inside the one-line description.
        chomp $dumped_value;
        push @fields, "s=$token_name", "t=$dumped_value";
    } ## end else [ if ( defined $cause ) ]

    return '[' . join( '; ', @fields ) . ']';
} ## end sub Marpa::PP::show_link_choice
|
612
|
|
|
|
|
|
|
|
|
613
|
|
|
|
|
|
|
# Describes one Leo link as "[l=<Leo item name>; c=<cause item name>]".
# A Leo link is an array: ( Leo item, cause ).
# The "l=" field is left out when the link has no Leo item.
sub Marpa::PP::show_leo_link_choice {
    my ( $recce, $leo_link ) = @_;
    my ( $leo_item, $cause ) = @{$leo_link};
    my @fields = (
        (   $leo_item
            ? 'l=' . Marpa::PP::leo_item_name( $recce, $leo_item )
            : ()
        ),
        'c=' . Marpa::PP::Internal::Earley_Item::name($cause),
    );
    return '[' . join( '; ', @fields ) . ']';
} ## end sub Marpa::PP::show_leo_link_choice
|
624
|
|
|
|
|
|
|
|
|
625
|
|
|
|
|
|
|
# Short name of an Earley item, in the form
# "S<AHFA state ID>@<origin>-<set>".
sub Marpa::PP::Internal::Earley_Item::name {
    my ($item) = @_;
    my $state_id =
        $item->[Marpa::PP::Internal::Earley_Item::STATE]
        ->[Marpa::PP::Internal::AHFA::ID];
    my $origin = $item->[Marpa::PP::Internal::Earley_Item::ORIGIN];
    my $set    = $item->[Marpa::PP::Internal::Earley_Item::SET];
    return sprintf 'S%d@%d-%d', $state_id, $origin, $set;
} ## end sub Marpa::PP::Internal::Earley_Item::name
|
633
|
|
|
|
|
|
|
|
|
634
|
|
|
|
|
|
|
# Renders one Earley item as a single line of text:
# the item's name, then a description of each of its links,
# then a description of each of its Leo links, separated by spaces.
# Within each group the descriptions are ordered numerically by
# ( middle location, AHFA state ID of the cause, symbol ID ).
sub Marpa::PP::show_earley_item {
    my ( $recce, $item ) = @_;
    my $grammar     = $recce->[Marpa::PP::Internal::Recognizer::GRAMMAR];
    my $symbol_hash = $grammar->[Marpa::PP::Internal::Grammar::SYMBOL_HASH];
    my $links       = $item->[Marpa::PP::Internal::Earley_Item::LINKS];
    my $leo_links   = $item->[Marpa::PP::Internal::Earley_Item::LEO_LINKS];

    # Comparator for the decorated rows built below.  A row is
    # [ middle, cause state ID, symbol ID, description ].
    my $by_sort_keys = sub {
        return $a->[0] <=> $b->[0]
            || $a->[1] <=> $b->[1]
            || $a->[2] <=> $b->[2];
    };

    my @pieces = ( Marpa::PP::Internal::Earley_Item::name($item) );

    if ( defined $links and @{$links} ) {
        my @rows = map {
            my $link = $_;
            my ( $predecessor, $cause, $token_name ) = @{$link};
            [

                # The actual middle of a link with no predecessor
                # is the origin of the Earley item which contains
                # this link, but for sorting purposes any number
                # less than that will do
                (   defined $predecessor
                    ? $predecessor->[Marpa::PP::Internal::Earley_Item::SET]
                    : -1
                ),
                (   defined $cause
                    ? $cause->[Marpa::PP::Internal::Earley_Item::STATE]
                        ->[Marpa::PP::Internal::AHFA::ID]
                    : -1
                ),
                ( defined $token_name ? $symbol_hash->{$token_name} : -1 ),
                Marpa::PP::show_link_choice($link),
            ]
        } @{$links};
        push @pieces, map { $_->[-1] } sort $by_sort_keys @rows;
    } ## end if ( defined $links and @{$links} )

    if ( defined $leo_links and @{$leo_links} ) {
        my @rows = map {
            my $leo_link = $_;
            my ( $leo_item, $cause ) = @{$leo_link};
            my $symbol_name = $leo_item
                ->[Marpa::PP::Internal::Leo_Item::LEO_POSTDOT_SYMBOL];
            [   $leo_item->[Marpa::PP::Internal::Leo_Item::SET],
                $cause->[Marpa::PP::Internal::Earley_Item::STATE]
                    ->[Marpa::PP::Internal::AHFA::ID],
                $symbol_hash->{$symbol_name},
                Marpa::PP::show_leo_link_choice( $recce, $leo_link ),
            ]
        } @{$leo_links};
        push @pieces, map { $_->[-1] } sort $by_sort_keys @rows;
    } ## end if ( defined $leo_links and @{$leo_links} )

    return join q{ }, @pieces;
} ## end sub Marpa::PP::show_earley_item
|
701
|
|
|
|
|
|
|
|
|
702
|
|
|
|
|
|
|
# Short name of a Leo item, in the form "L<symbol ID>@<set>".
# The symbol ID is looked up in the grammar's SYMBOL_HASH,
# using the name of the Leo item's postdot symbol as the key.
sub Marpa::PP::leo_item_name {
    my ( $recce, $leo_item ) = @_;
    my $grammar     = $recce->[Marpa::PP::Internal::Recognizer::GRAMMAR];
    my $symbol_hash = $grammar->[Marpa::PP::Internal::Grammar::SYMBOL_HASH];
    my $postdot_symbol_name =
        $leo_item->[Marpa::PP::Internal::Leo_Item::LEO_POSTDOT_SYMBOL];
    return sprintf 'L%d@%d', $symbol_hash->{$postdot_symbol_name},
        $leo_item->[Marpa::PP::Internal::Leo_Item::SET];
} ## end sub Marpa::PP::leo_item_name
|
712
|
|
|
|
|
|
|
|
|
713
|
|
|
|
|
|
|
# Renders one Leo item as text:
#   <Leo item name> ["<postdot symbol>"; <predecessor name>; <base name>]
# The predecessor field is present only when the Leo item has a
# predecessor.  The base is an Earley item and is named accordingly.
sub Marpa::PP::show_leo_item {
    my ( $recce, $item ) = @_;
    my $leo_symbol_name =
        $item->[Marpa::PP::Internal::Leo_Item::LEO_POSTDOT_SYMBOL];
    my $predecessor = $item->[Marpa::PP::Internal::Leo_Item::PREDECESSOR];
    my $base        = $item->[Marpa::PP::Internal::Leo_Item::BASE];

    my $label   = Marpa::PP::leo_item_name( $recce, $item );
    my @details = ( qq{"$leo_symbol_name"} );
    push @details, Marpa::PP::leo_item_name( $recce, $predecessor )
        if $predecessor;
    push @details, Marpa::PP::Internal::Earley_Item::name($base);

    return $label . ' [' . join( '; ', @details ) . ']';
} ## end sub Marpa::PP::show_leo_item
|
729
|
|
|
|
|
|
|
|
|
730
|
|
|
|
|
|
|
# Renders every Earley item of one Earley set, one item per line.
# The lines are ordered numerically by the item's origin and then
# by the ID of its AHFA state.
sub Marpa::PP::show_earley_set {
    my ( $recce, $earley_set ) = @_;
    my $items = $earley_set->[Marpa::PP::Internal::Earley_Set::ITEMS];

    # Decorate each item with its sort keys: [ origin, state ID, line ]
    my @rows = map {
        my $item = $_;
        [   $item->[Marpa::PP::Internal::Earley_Item::ORIGIN],
            $item->[Marpa::PP::Internal::Earley_Item::STATE]
                ->[Marpa::PP::Internal::AHFA::ID],
            Marpa::PP::show_earley_item( $recce, $item ) . "\n"
        ]
    } @{$items};

    my $text = q{};
    for my $row ( sort { $a->[0] <=> $b->[0] || $a->[1] <=> $b->[1] } @rows )
    {
        $text .= $row->[-1];
    }
    return $text;
} ## end sub Marpa::PP::show_earley_set
|
745
|
|
|
|
|
|
|
|
|
746
|
|
|
|
|
|
|
# Renders the Leo items found in a postdot set, one per line.
# The postdot set is a hash whose values are arrays of items; only
# the entries whose class is $LEO_CLASS are shown.  The lines are
# ordered numerically by the ID of each Leo item's postdot symbol.
sub Marpa::PP::show_postdot_set {
    my ( $recce, $postdot_set ) = @_;
    my $grammar     = $recce->[Marpa::PP::Internal::Recognizer::GRAMMAR];
    my $symbol_hash = $grammar->[Marpa::PP::Internal::Grammar::SYMBOL_HASH];

    my @leo_items =
        grep { ref($_) eq $LEO_CLASS }
        map  { @{$_} } values %{$postdot_set};

    # Decorate with the symbol ID, sort on it, then undecorate
    my @leo_items_by_symbol_id =
        map  { $_->[0] }
        sort { $a->[1] <=> $b->[1] }
        map {
        my $leo_item = $_;
        my $symbol_name =
            $leo_item->[Marpa::PP::Internal::Leo_Item::LEO_POSTDOT_SYMBOL];
        [ $leo_item, $symbol_hash->{$symbol_name} ]
        } @leo_items;

    return join q{},
        map { Marpa::PP::show_leo_item( $recce, $_ ) . "\n" }
        @leo_items_by_symbol_id;
} ## end sub Marpa::PP::show_postdot_set
|
769
|
|
|
|
|
|
|
|
|
770
|
|
|
|
|
|
|
# Renders a whole list of Earley sets.  For every defined entry of
# the list the output has a heading, "Earley Set <index>", followed
# by the Earley items of the set and then, if the set has a postdot
# set, by its Leo items.  Undefined entries of the list are skipped.
sub Marpa::PP::show_earley_set_list {
    my ( $recce, $earley_set_list ) = @_;
    my $set_count = scalar @{$earley_set_list};
    my $text      = q{};
    for my $ix ( 0 .. $set_count - 1 ) {
        my $set = $earley_set_list->[$ix];
        if ( defined $set ) {
            $text .= "Earley Set $ix\n";
            $text .= Marpa::PP::show_earley_set( $recce, $set );
            my $postdot_set =
                $set->[Marpa::PP::Internal::Earley_Set::POSTDOT];
            if ( defined $postdot_set ) {
                $text .= Marpa::PP::show_postdot_set( $recce, $postdot_set );
            }
        } ## end if ( defined $set )
    } ## end for my $ix ( 0 .. $set_count - 1 )
    return $text;
} ## end sub Marpa::PP::show_earley_set_list
|
787
|
|
|
|
|
|
|
|
|
788
|
|
|
|
|
|
|
# Renders all the Earley sets of the recognizer.  The first line
# gives the last completed earleme and the furthest earleme; the
# rest is the output of Marpa::PP::show_earley_set_list().
# When the last completed earleme is not defined, the word
# "stripped" is shown in its place.
sub Marpa::PP::Recognizer::show_earley_sets {
    my ($recce) = @_;
    my $last_completed = $recce->[LAST_COMPLETED_EARLEME] // 'stripped';
    my $furthest       = $recce->[FURTHEST_EARLEME];

    my $header = "Last Completed: $last_completed; ";
    $header .= "Furthest: $furthest\n";

    return $header
        . Marpa::PP::show_earley_set_list( $recce, $recce->[EARLEY_SETS] );
} ## end sub Marpa::PP::Recognizer::show_earley_sets
|
800
|
|
|
|
|
|
|
|
|
801
|
|
|
|
|
|
|
# Layout of one progress report record.
# The structure description below is handed to Marpa::PP::offset()
# at compile time.  Presumably that call defines RULE_ID, POSITION
# and ORIGIN as array-index constants in the package named on the
# ":package=" line -- show_progress() reads report records with
# Marpa::PP::Internal::Progress_Report::RULE_ID and friends --
# TODO confirm against Marpa::PP::offset().
BEGIN {
    my $structure = <<'END_OF_STRUCTURE';

:package=Marpa::PP::Internal::Progress_Report

RULE_ID
POSITION
ORIGIN

END_OF_STRUCTURE
    Marpa::PP::offset($structure);
} ## end BEGIN
|
813
|
|
|
|
|
|
|
|
|
814
|
|
|
|
|
|
|
# Returns a text report of the progress of the parse, for a range
# of Earley sets.
#
# Arguments:
#   $start_ordinal -- the first Earley set to report.  It must be in
#       the range 0 to the last ordinal.  If it is not defined, the
#       report starts at the recognizer's LAST_COMPLETED_EARLEME.
#   $end_ordinal -- the last Earley set to report.  A negative value
#       counts back from the end, so that -1 is the last Earley set.
#       After that adjustment it must be in the range 0 to the last
#       ordinal.  If it is not defined, only the start set is reported.
#
# A bad argument is not fatal: the return value is then a description
# of the problem instead of a report.
#
# The report has one line for each (rule, dot position) pair in each
# reported set, ordered by rule ID and then by position.  A line is
#   "F<rule>"            if the dot is at or after the end of the RHS,
#   "R<rule>:<position>" if the dot is at another non-zero position,
#   "P<rule>"            if the dot is at position 0,
# then " x<count>" if the pair has more than one origin, then
# " @<origins>-<current> ", and finally the dotted rule as rendered
# by Marpa::PP::show_dotted_rule().  Up to three origins are listed
# in full; more are abbreviated to "<first>...<last>".
#
# NOTE(review): explicit arguments are checked against
# EARLEY_SETS_BY_ORDINAL, while the default start is an earleme and
# report_progress() uses each index to subscript EARLEY_SETS.
# Presumably ordinals and earlemes coincide for the callers of this
# method -- confirm.
sub Marpa::PP::Recognizer::show_progress {
    my ( $recce, $start_ordinal, $end_ordinal ) = @_;
    my $grammar = $recce->[Marpa::PP::Internal::Recognizer::GRAMMAR];
    my $rules   = $grammar->[Marpa::PP::Internal::Grammar::RULES];

    my $earley_sets_by_ordinal =
        $recce->[Marpa::PP::Internal::Recognizer::EARLEY_SETS_BY_ORDINAL];
    my $last_ordinal = $#{$earley_sets_by_ordinal};

    my $start_ix;
    if ( not defined $start_ordinal ) {
        $start_ix =
            $recce->[Marpa::PP::Internal::Recognizer::LAST_COMPLETED_EARLEME];
    }
    else {
        if ( $start_ordinal < 0 or $start_ordinal > $last_ordinal ) {
            return
                "Marpa::PP::Recognizer::show_progress start index is $start_ordinal, "
                . "must be in range 0-$last_ordinal";
        }
        $start_ix =
            $earley_sets_by_ordinal->[$start_ordinal]
            ->[Marpa::PP::Internal::Earley_Set::ORDINAL];
    } ## end else [ if ( not defined $start_ordinal ) ]

    my $end_ix;
    if ( not defined $end_ordinal ) {
        $end_ix = $start_ix;
    }
    else {

        # Remember the caller's value: the error message must show
        # it, and not the value adjusted for counting from the end.
        my $end_ordinal_argument = $end_ordinal;
        if ( $end_ordinal < 0 ) {
            $end_ordinal += $last_ordinal + 1;
        }

        # Both bounds must be checked.  An index above the last
        # ordinal would otherwise be dereferenced below, which
        # creates a bogus, empty Earley set inside the recognizer
        # and leaves the end of the range undefined.
        if ( $end_ordinal < 0 or $end_ordinal > $last_ordinal ) {
            return
                "Marpa::PP::Recognizer::show_progress end index is $end_ordinal_argument, "
                . sprintf ' must be in range %d-%d', -( $last_ordinal + 1 ),
                $last_ordinal;
        } ## end if ( $end_ordinal < 0 or $end_ordinal > $last_ordinal)
        $end_ix =
            $earley_sets_by_ordinal->[$end_ordinal]
            ->[Marpa::PP::Internal::Earley_Set::ORDINAL];
    } ## end else [ if ( not defined $end_ordinal ) ]

    my $text = q{};
    for my $current ( $start_ix .. $end_ix ) {

        # Group the raw reports: rule ID => position => origin => count.
        # Duplicate reports collapse into a single hash entry here.
        my %by_rule_by_position = ();
        my $reports = report_progress( $recce, $current );

        for my $report ( @{$reports} ) {
            my $rule_id =
                $report->[Marpa::PP::Internal::Progress_Report::RULE_ID];
            my $position =
                $report->[Marpa::PP::Internal::Progress_Report::POSITION];
            my $origin =
                $report->[Marpa::PP::Internal::Progress_Report::ORIGIN];

            $by_rule_by_position{$rule_id}->{$position}->{$origin}++;
        } ## end for my $report ( @{$reports} )

        for my $rule_id ( sort { $a <=> $b } keys %by_rule_by_position ) {
            my $by_position = $by_rule_by_position{$rule_id};
            for my $position ( sort { $a <=> $b } keys %{$by_position} ) {
                my $raw_origins   = $by_position->{$position};
                my @origins       = sort { $a <=> $b } keys %{$raw_origins};
                my $origins_count = scalar @origins;

                # Long lists of origins are abbreviated to their extremes
                my $origin_desc;
                if ( $origins_count <= 3 ) {
                    $origin_desc = join q{,}, @origins;
                }
                else {
                    $origin_desc = $origins[0] . q{...} . $origins[-1];
                }

                my $rule = $rules->[$rule_id];
                my $rhs_length =
                    scalar @{ $rule->[Marpa::PP::Internal::Rule::RHS] };
                my $item_text;

                # The tag at the start of the line depends on where
                # the dot is in the rule
                if ( $position >= $rhs_length ) {
                    $item_text .= "F$rule_id";
                }
                elsif ($position) {
                    $item_text .= "R$rule_id:$position";
                }
                else {
                    $item_text .= "P$rule_id";
                }
                $item_text .= " x$origins_count" if $origins_count > 1;
                $item_text .= q{ @} . $origin_desc . q{-} . $current . q{ };
                $item_text .= Marpa::PP::show_dotted_rule( $rule, $position );
                $text .= $item_text . "\n";
            } ## end for my $position ( sort { $a <=> $b } keys %{...})
        } ## end for my $rule_id ( sort { $a <=> $b } keys ...)
    } ## end for my $current ( $start_ix .. $end_ix )
    return $text;
} ## end sub Marpa::PP::Recognizer::show_progress
|
912
|
|
|
|
|
|
|
|
|
913
|
|
|
|
|
|
|
# Collects the raw progress reports for the Earley set at index
# $current of the recognizer's EARLEY_SETS.
# Returns a reference to an array of reports, each of them
#   [ rule ID, position in the rule, origin, $current ]
# with one report for every NFA state of every AHFA state on the
# work list.  The work list holds the state of each Earley item in
# the set, plus one state for every Leo item reachable through the
# Leo links of those Earley items.
# Rules with a true VIRTUAL_START are reported in terms of their
# ORIGINAL_RULE.
sub report_progress {
    my ( $recce, $current ) = @_;

    my $earley_set =
        $recce->[Marpa::PP::Internal::Recognizer::EARLEY_SETS]->[$current];
    my $earley_items = $earley_set->[Marpa::PP::Internal::Earley_Set::ITEMS];

    # Phase 1: build the work list of [ origin, AHFA state ] pairs.
    # Duplicates are not dealt with here -- they are more easily dealt
    # with when sorting, which is done in the display logic.
    my @worklist;
    for my $earley_item ( @{$earley_items} ) {
        push @worklist,
            [
            $earley_item->[Marpa::PP::Internal::Earley_Item::ORIGIN],
            $earley_item->[Marpa::PP::Internal::Earley_Item::STATE]
            ];

        for my $leo_link (
            @{ $earley_item->[Marpa::PP::Internal::Earley_Item::LEO_LINKS]
                    // [] } )
        {

            # The first element of the link is the Leo item, which
            # needs to be expanded: follow its chain of predecessors
            for (
                my $leo_item = $leo_link->[0];
                $leo_item;
                $leo_item =
                $leo_item->[Marpa::PP::Internal::Leo_Item::PREDECESSOR]
                )
            {
                my $leo_symbol_name = $leo_item
                    ->[Marpa::PP::Internal::Leo_Item::LEO_POSTDOT_SYMBOL];
                my $leo_base_item =
                    $leo_item->[Marpa::PP::Internal::Leo_Item::BASE];

                # The state of interest is the second element of the
                # base item's transition on the Leo symbol
                my $base_to_state = (
                    @{  $leo_base_item
                            ->[Marpa::PP::Internal::Earley_Item::STATE]
                            ->[Marpa::PP::Internal::AHFA::TRANSITION]
                            ->{$leo_symbol_name}
                        }
                )[1];
                push @worklist,
                    [
                    $leo_item->[Marpa::PP::Internal::Leo_Item::SET],
                    $base_to_state
                    ];
            } ## end for ( my $leo_item = $leo_link->[0]; $leo_item; ...)
        } ## end for my $leo_link ( @{ $earley_item->[...]})
    } ## end for my $earley_item ( @{$earley_items} )

    # Phase 2: turn every NFA state of every work item into a report
    my @progress_report;
    for my $workitem (@worklist) {
        my ( $origin, $AHFA_state ) = @{$workitem};
        my $NFA_states = $AHFA_state->[Marpa::PP::Internal::AHFA::NFA_STATES];
        Marpa::PP::exception(
            'Cannot report progress of Marpa::PP::Recognizer: it is stripped'
        ) if not $NFA_states;

        for my $NFA_state ( @{$NFA_states} ) {
            my $LR0_item   = $NFA_state->[Marpa::PP::Internal::NFA::ITEM];
            my $marpa_rule = $LR0_item->[Marpa::PP::Internal::LR0_item::RULE];
            my $marpa_position =
                $LR0_item->[Marpa::PP::Internal::LR0_item::POSITION];
            my $chaf_start =
                $marpa_rule->[Marpa::PP::Internal::Rule::VIRTUAL_START];

            my $original_rule;

            # position in original rule, to be calculated
            my $original_position;
            if ($chaf_start) {
                $original_rule =
                    $marpa_rule->[Marpa::PP::Internal::Rule::ORIGINAL_RULE];
                my $original_rhs =
                    $original_rule->[Marpa::PP::Internal::Rule::RHS];
                my $chaf_rhs = $marpa_rule->[Marpa::PP::Internal::Rule::RHS];

                # A dot at the end of the rewritten rule is at the end
                # of the original rule; otherwise shift it by the offset
                # of the rewritten rule within the original one
                $original_position =
                    $marpa_position >= scalar @{$chaf_rhs}
                    ? scalar @{$original_rhs}
                    : ( $chaf_start + $marpa_position );
            } ## end if ($chaf_start)
            else {
                $original_rule     = $marpa_rule;
                $original_position = $marpa_position;
            }

            push @progress_report,
                [
                $original_rule->[Marpa::PP::Internal::Rule::ID],
                $original_position, $origin, $current
                ];
        } ## end for my $NFA_state ( @{$NFA_states} )
    } ## end for my $workitem (@worklist)
    return \@progress_report;
} ## end sub report_progress
|
999
|
|
|
|
|
|
|
|
|
1000
|
|
|
|
|
|
|
# Reads one token: offers it to the recognizer with alternative()
# and, if that call returns a defined value, completes the earleme
# and returns the result of earleme_complete().
# Returns undef if alternative() returns undef.
sub Marpa::PP::Recognizer::read {

    # For efficiency, the token arguments are not unpacked.
    # After the shift, @_ is ( $symbol_name, $value ) and is
    # passed on to alternative() as it is.
    my $recce = shift;
    if ( defined $recce->alternative(@_) ) {
        return $recce->earleme_complete();
    }

    # An explicit undef, so that a list-context caller still
    # receives exactly one element
    return undef;    ## no critic (Subroutines::ProhibitExplicitReturnUndef)
} ## end sub Marpa::PP::Recognizer::read
|
1008
|
|
|
|
|
|
|
|
|
1009
|
|
|
|
|
|
|
sub Marpa::PP::Recognizer::alternative { |
|
1010
|
|
|
|
|
|
|
|
|
1011
|
1961
|
|
|
1961
|
0
|
6745
|
my ( $recce, $symbol_name, $value, $length ) = @_; |
|
1012
|
|
|
|
|
|
|
|
|
1013
|
1961
|
50
|
|
|
|
6712
|
Marpa::PP::exception( |
|
1014
|
|
|
|
|
|
|
'Missing recognizer argument for Marpa::PP::Recognizer::alternative()' |
|
1015
|
|
|
|
|
|
|
) if not defined $recce; |
|
1016
|
|
|
|
|
|
|
|
|
1017
|
|
|
|
|
|
|
{ |
|
1018
|
1961
|
|
|
|
|
2812
|
my $recce_class = ref $recce; |
|
|
1961
|
|
|
|
|
3930
|
|
|
1019
|
1961
|
|
50
|
|
|
4955
|
$recce_class //= 'not defined'; |
|
1020
|
1961
|
50
|
|
|
|
7270
|
Marpa::PP::exception( |
|
1021
|
|
|
|
|
|
|
"recognizer argument of alternative() has wrong class\n", |
|
1022
|
|
|
|
|
|
|
'Class of argument is ', |
|
1023
|
|
|
|
|
|
|
$recce_class, |
|
1024
|
|
|
|
|
|
|
"\n", |
|
1025
|
|
|
|
|
|
|
"Class of argument should be Marpa::PP::Recognizer\n" |
|
1026
|
|
|
|
|
|
|
) if $recce_class ne 'Marpa::PP::Recognizer'; |
|
1027
|
|
|
|
|
|
|
} |
|
1028
|
|
|
|
|
|
|
|
|
1029
|
1961
|
|
|
|
|
13780
|
my $grammar = $recce->[Marpa::PP::Internal::Recognizer::GRAMMAR]; |
|
1030
|
1961
|
|
|
|
|
6245
|
local $Marpa::PP::Internal::TRACE_FH = my $trace_fh = |
|
1031
|
|
|
|
|
|
|
$recce->[Marpa::PP::Internal::Recognizer::TRACE_FILE_HANDLE]; |
|
1032
|
1961
|
|
|
|
|
3591
|
my $trace_terminals = |
|
1033
|
|
|
|
|
|
|
$recce->[Marpa::PP::Internal::Recognizer::TRACE_TERMINALS]; |
|
1034
|
1961
|
|
|
|
|
3095
|
my $warnings = $recce->[Marpa::PP::Internal::Recognizer::WARNINGS]; |
|
1035
|
|
|
|
|
|
|
|
|
1036
|
1961
|
50
|
|
|
|
6580
|
Marpa::PP::exception('Attempt to read token after parsing is finished') |
|
1037
|
|
|
|
|
|
|
if $recce->[Marpa::PP::Internal::Recognizer::FINISHED]; |
|
1038
|
|
|
|
|
|
|
|
|
1039
|
1961
|
50
|
|
|
|
4927
|
Marpa::PP::exception('Attempt to read token when parsing is exhausted') |
|
1040
|
|
|
|
|
|
|
if $recce->[Marpa::PP::Internal::Recognizer::EXHAUSTED]; |
|
1041
|
|
|
|
|
|
|
|
|
1042
|
1961
|
|
|
|
|
3911
|
my $terminal_names = |
|
1043
|
|
|
|
|
|
|
$grammar->[Marpa::PP::Internal::Grammar::TERMINAL_NAMES]; |
|
1044
|
|
|
|
|
|
|
|
|
1045
|
1961
|
|
|
|
|
4049
|
my $current_earleme = |
|
1046
|
|
|
|
|
|
|
$recce->[Marpa::PP::Internal::Recognizer::LAST_COMPLETED_EARLEME]; |
|
1047
|
1961
|
|
|
|
|
2739
|
my $earley_set_list = |
|
1048
|
|
|
|
|
|
|
$recce->[Marpa::PP::Internal::Recognizer::EARLEY_SETS]; |
|
1049
|
1961
|
|
|
|
|
2965
|
my $AHFA = $grammar->[Marpa::PP::Internal::Grammar::AHFA]; |
|
1050
|
1961
|
|
|
|
|
3443
|
my $symbols = $grammar->[Marpa::PP::Internal::Grammar::SYMBOLS]; |
|
1051
|
1961
|
|
|
|
|
2615
|
my $symbol_hash = $grammar->[Marpa::PP::Internal::Grammar::SYMBOL_HASH]; |
|
1052
|
|
|
|
|
|
|
|
|
1053
|
1961
|
|
|
|
|
3823
|
my $postdot_here = |
|
1054
|
|
|
|
|
|
|
$earley_set_list->[$current_earleme] |
|
1055
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Set::POSTDOT]; |
|
1056
|
|
|
|
|
|
|
|
|
1057
|
1961
|
50
|
33
|
|
|
10427
|
if ( not defined $symbol_name or not $terminal_names->{$symbol_name} ) { |
|
1058
|
0
|
0
|
|
|
|
0
|
my $problem = |
|
1059
|
|
|
|
|
|
|
defined $symbol_name |
|
1060
|
|
|
|
|
|
|
? qq{Token name "$symbol_name" is not the name of a terminal symbol} |
|
1061
|
|
|
|
|
|
|
: q{Undef given, instead of the name of a terminal symbol}; |
|
1062
|
0
|
|
|
|
|
0
|
Marpa::PP::exception($problem); |
|
1063
|
|
|
|
|
|
|
} ## end if ( not defined $symbol_name or not $terminal_names...) |
|
1064
|
|
|
|
|
|
|
|
|
1065
|
1961
|
|
100
|
|
|
10209
|
$length //= 1; |
|
1066
|
|
|
|
|
|
|
|
|
1067
|
|
|
|
|
|
|
# Make sure it's an allowed terminal symbol. |
|
1068
|
1961
|
|
|
|
|
3399
|
my $postdot_data = $postdot_here->{$symbol_name}; |
|
1069
|
1961
|
100
|
|
|
|
5499
|
if ( not $postdot_data ) { |
|
1070
|
1
|
50
|
|
|
|
5
|
if ($trace_terminals) { |
|
1071
|
1
|
50
|
|
|
|
3
|
say {$trace_fh} qq{Rejected "$symbol_name" at $current_earleme-} |
|
|
1
|
|
|
|
|
11
|
|
|
1072
|
|
|
|
|
|
|
. ( $length + $current_earleme ) |
|
1073
|
|
|
|
|
|
|
or Marpa::PP::exception("Cannot print: $ERRNO"); |
|
1074
|
|
|
|
|
|
|
} |
|
1075
|
1
|
|
|
|
|
6
|
return; |
|
1076
|
|
|
|
|
|
|
} ## end if ( not $postdot_data ) |
|
1077
|
|
|
|
|
|
|
|
|
1078
|
1960
|
|
|
|
|
2800
|
my $value_ref = \($value); |
|
1079
|
|
|
|
|
|
|
|
|
1080
|
1960
|
100
|
|
|
|
5660
|
if ( $length & Marpa::PP::Internal::Recognizer::EARLEME_MASK ) { |
|
1081
|
1
|
|
|
|
|
463
|
Marpa::PP::exception( |
|
1082
|
|
|
|
|
|
|
'Token ' . $symbol_name . " is too long\n", |
|
1083
|
|
|
|
|
|
|
" Token starts at $current_earleme, and its length is $length\n" |
|
1084
|
|
|
|
|
|
|
); |
|
1085
|
|
|
|
|
|
|
} ## end if ( $length & Marpa::PP::Internal::Recognizer::EARLEME_MASK) |
|
1086
|
|
|
|
|
|
|
|
|
1087
|
1959
|
50
|
|
|
|
4831
|
if ( $length <= 0 ) { |
|
1088
|
0
|
|
|
|
|
0
|
Marpa::PP::exception( |
|
1089
|
|
|
|
|
|
|
'Token ' . $symbol_name . ' has non-positive length ' . $length ); |
|
1090
|
|
|
|
|
|
|
} |
|
1091
|
|
|
|
|
|
|
|
|
1092
|
1959
|
|
|
|
|
3066
|
my $end_earleme = $current_earleme + $length; |
|
1093
|
|
|
|
|
|
|
|
|
1094
|
1959
|
50
|
|
|
|
4295
|
Marpa::PP::exception( |
|
1095
|
|
|
|
|
|
|
'Token ' . $symbol_name . " makes parse too long\n", |
|
1096
|
|
|
|
|
|
|
" Token starts at $current_earleme, and its length is $length\n" |
|
1097
|
|
|
|
|
|
|
) if $end_earleme & Marpa::PP::Internal::Recognizer::EARLEME_MASK; |
|
1098
|
|
|
|
|
|
|
|
|
1099
|
1959
|
|
|
|
|
2477
|
my $accepted = 0; # for trace_terminals |
|
1100
|
1959
|
|
|
|
|
3702
|
my $target_ix = $current_earleme + $length; |
|
1101
|
1959
|
|
100
|
|
|
11034
|
my $target_earley_set = $earley_set_list->[$target_ix] //= []; |
|
1102
|
1959
|
|
100
|
|
|
10471
|
my $target_earley_items = |
|
1103
|
|
|
|
|
|
|
$target_earley_set->[Marpa::PP::Internal::Earley_Set::ITEMS] //= []; |
|
1104
|
1959
|
|
100
|
|
|
12456
|
my $target_hash = |
|
1105
|
|
|
|
|
|
|
$target_earley_set->[Marpa::PP::Internal::Earley_Set::HASH] //= {}; |
|
1106
|
|
|
|
|
|
|
|
|
1107
|
1959
|
|
|
|
|
2744
|
EARLEY_ITEM: for my $postdot_item ( @{$postdot_data} ) { |
|
|
1959
|
|
|
|
|
14533
|
|
|
1108
|
|
|
|
|
|
|
|
|
1109
|
2352
|
|
|
|
|
2867
|
my $origin; |
|
1110
|
|
|
|
|
|
|
my @to_states; |
|
1111
|
2352
|
100
|
|
|
|
7524
|
next EARLEY_ITEM if ref $postdot_item eq $LEO_CLASS; |
|
1112
|
|
|
|
|
|
|
{ |
|
1113
|
2345
|
|
|
|
|
4079
|
my $state = |
|
|
2345
|
|
|
|
|
4785
|
|
|
1114
|
|
|
|
|
|
|
$postdot_item->[Marpa::PP::Internal::Earley_Item::STATE]; |
|
1115
|
3210
|
|
|
|
|
7556
|
@to_states = |
|
1116
|
2345
|
|
|
|
|
6801
|
grep {ref} |
|
1117
|
2345
|
|
|
|
|
3196
|
@{ $state->[Marpa::PP::Internal::AHFA::TRANSITION] |
|
1118
|
|
|
|
|
|
|
->{$symbol_name} }; |
|
1119
|
2345
|
50
|
|
|
|
5877
|
next EARLEY_ITEM if not scalar @to_states; |
|
1120
|
2345
|
|
|
|
|
4999
|
$origin = |
|
1121
|
|
|
|
|
|
|
$postdot_item->[Marpa::PP::Internal::Earley_Item::ORIGIN]; |
|
1122
|
|
|
|
|
|
|
} |
|
1123
|
|
|
|
|
|
|
|
|
1124
|
2345
|
|
|
|
|
2709
|
$accepted++; |
|
1125
|
|
|
|
|
|
|
|
|
1126
|
2345
|
|
|
|
|
4451
|
TO_STATE: for my $to_state (@to_states) { |
|
1127
|
3150
|
|
|
|
|
5152
|
my $reset = $to_state->[Marpa::PP::Internal::AHFA::RESET_ORIGIN]; |
|
1128
|
3150
|
100
|
|
|
|
7483
|
my $new_origin = $reset ? $target_ix : $origin; |
|
1129
|
3150
|
|
|
|
|
4882
|
my $to_state_id = $to_state->[Marpa::PP::Internal::AHFA::ID]; |
|
1130
|
3150
|
|
|
|
|
6838
|
my $hash_key = join q{:}, $to_state_id, $new_origin; |
|
1131
|
3150
|
|
|
|
|
10089
|
my $target_item = $target_hash->{$hash_key}; |
|
1132
|
3150
|
100
|
|
|
|
6558
|
if ( defined $target_item ) { |
|
1133
|
110
|
100
|
|
|
|
594
|
next TO_STATE if $reset; |
|
1134
|
10
|
100
|
|
|
|
25
|
if ($postdot_item->[Marpa::PP::Internal::Earley_Item::ID] ~~ [ |
|
|
10
|
|
|
|
|
55
|
|
|
1135
|
|
|
|
|
|
|
map { |
|
1136
|
10
|
|
|
|
|
22
|
$_->[0]->[Marpa::PP::Internal::Earley_Item::ID] |
|
1137
|
|
|
|
|
|
|
} @{ |
|
1138
|
|
|
|
|
|
|
$target_item |
|
1139
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::LINKS] |
|
1140
|
|
|
|
|
|
|
} |
|
1141
|
|
|
|
|
|
|
] |
|
1142
|
|
|
|
|
|
|
) |
|
1143
|
|
|
|
|
|
|
{ |
|
1144
|
2
|
|
|
|
|
713
|
Marpa::PP::exception( |
|
1145
|
|
|
|
|
|
|
qq{"$symbol_name" already scanned with length $length at location $current_earleme} |
|
1146
|
|
|
|
|
|
|
); |
|
1147
|
|
|
|
|
|
|
} ## end if ( $postdot_item->[...]) |
|
1148
|
|
|
|
|
|
|
} ## end if ( defined $target_item ) |
|
1149
|
|
|
|
|
|
|
else { |
|
1150
|
|
|
|
|
|
|
|
|
1151
|
3040
|
|
|
|
|
5020
|
$target_item = []; |
|
1152
|
3040
|
|
|
|
|
7935
|
$target_item->[Marpa::PP::Internal::Earley_Item::ID] = |
|
1153
|
|
|
|
|
|
|
$recce |
|
1154
|
|
|
|
|
|
|
->[ Marpa::PP::Internal::Recognizer::NEXT_EARLEY_ITEM_ID |
|
1155
|
|
|
|
|
|
|
]++; |
|
1156
|
3040
|
|
|
|
|
4517
|
$target_item->[Marpa::PP::Internal::Earley_Item::STATE] = |
|
1157
|
|
|
|
|
|
|
$to_state; |
|
1158
|
3040
|
|
|
|
|
7167
|
$target_item->[Marpa::PP::Internal::Earley_Item::ORIGIN] = |
|
1159
|
|
|
|
|
|
|
$new_origin; |
|
1160
|
3040
|
|
|
|
|
5615
|
$target_item->[Marpa::PP::Internal::Earley_Item::LEO_LINKS] = |
|
1161
|
|
|
|
|
|
|
[]; |
|
1162
|
3040
|
|
|
|
|
5408
|
$target_item->[Marpa::PP::Internal::Earley_Item::LINKS] = []; |
|
1163
|
3040
|
|
|
|
|
5694
|
$target_item->[Marpa::PP::Internal::Earley_Item::SET] = |
|
1164
|
|
|
|
|
|
|
$target_ix; |
|
1165
|
3040
|
|
|
|
|
8472
|
$target_hash->{$hash_key} = $target_item; |
|
1166
|
3040
|
|
|
|
|
3591
|
push @{$target_earley_items}, $target_item; |
|
|
3040
|
|
|
|
|
6371
|
|
|
1167
|
|
|
|
|
|
|
|
|
1168
|
|
|
|
|
|
|
} ## end else [ if ( defined $target_item ) ] |
|
1169
|
|
|
|
|
|
|
|
|
1170
|
3048
|
100
|
|
|
|
10843
|
next TO_STATE if $reset; |
|
1171
|
|
|
|
|
|
|
|
|
1172
|
2343
|
|
|
|
|
2947
|
push @{ $target_item->[Marpa::PP::Internal::Earley_Item::LINKS] }, |
|
|
2343
|
|
|
|
|
12540
|
|
|
1173
|
|
|
|
|
|
|
[ $postdot_item, undef, $symbol_name, $value_ref ]; |
|
1174
|
|
|
|
|
|
|
} # for my $to_state |
|
1175
|
|
|
|
|
|
|
|
|
1176
|
|
|
|
|
|
|
} ## end for my $postdot_item ( @{$postdot_data} ) |
|
1177
|
|
|
|
|
|
|
|
|
1178
|
1957
|
100
|
66
|
|
|
12246
|
if ( $accepted |
|
1179
|
|
|
|
|
|
|
and $target_ix |
|
1180
|
|
|
|
|
|
|
> $recce->[Marpa::PP::Internal::Recognizer::FURTHEST_EARLEME] ) |
|
1181
|
|
|
|
|
|
|
{ |
|
1182
|
1897
|
|
|
|
|
3023
|
$recce->[Marpa::PP::Internal::Recognizer::FURTHEST_EARLEME] = |
|
1183
|
|
|
|
|
|
|
$target_ix; |
|
1184
|
|
|
|
|
|
|
} ## end if ( $accepted and $target_ix > $recce->[...]) |
|
1185
|
|
|
|
|
|
|
|
|
1186
|
1957
|
100
|
|
|
|
4374
|
if ($trace_terminals) { |
|
1187
|
10
|
50
|
|
|
|
22
|
my $verb = $accepted ? 'Accepted' : 'Rejected'; |
|
1188
|
10
|
50
|
|
|
|
10
|
say {$trace_fh} qq{$verb "$symbol_name" at $current_earleme-} |
|
|
10
|
|
|
|
|
64
|
|
|
1189
|
|
|
|
|
|
|
. ( $length + $current_earleme ) |
|
1190
|
|
|
|
|
|
|
or Marpa::PP::exception("Cannot print: $ERRNO"); |
|
1191
|
|
|
|
|
|
|
} ## end if ($trace_terminals) |
|
1192
|
|
|
|
|
|
|
|
|
1193
|
1957
|
|
|
|
|
13291
|
return $current_earleme; |
|
1194
|
|
|
|
|
|
|
|
|
1195
|
|
|
|
|
|
|
} ## end sub Marpa::PP::Recognizer::alternative |
|
1196
|
|
|
|
|
|
|
|
|
1197
|
|
|
|
|
|
|
# Deprecated -- obsolete |
|
1198
|
|
|
|
|
|
|
# Feed a list of token descriptors to the recognizer (deprecated interface).
#
# Arguments:
#   $recce        - the recognizer; its class must be exactly
#                   'Marpa::PP::Recognizer'.
#   $tokens       - ref to an array of token descriptors.  Each descriptor
#                   is an array ref [ $symbol_name, $value, $length, $offset ].
#                   $offset defaults to 1 and must not be negative; it is
#                   added to the earleme at which the next token is read.
#   $token_ix_ref - optional ref to a SCALAR holding the index of the next
#                   descriptor to read.  Allowed only in 'stream' mode.
#                   When supplied, a token rejected by alternative() makes
#                   this method return early, with the index left pointing
#                   at the rejected token, instead of throwing.
#
# Returns the result of $recce->status().
#
# Throws (via Marpa::PP::exception) on a missing or wrongly-classed
# recognizer, a missing token list, a bad token index argument, tokens
# supplied after the parse is finished or exhausted, a descriptor that is
# not an array ref, an unexpected terminal (when no index ref was given),
# or a negative offset.
sub Marpa::PP::Recognizer::tokens {

    my ( $recce, $tokens, $token_ix_ref ) = @_;

    Marpa::PP::exception(
        'Missing recognizer argument for Marpa::PP::Recognizer::tokens()')
        if not defined $recce;

    {

        # ref() yields the empty string (never undef) for a non-reference,
        # so the fallback text has to be applied with ||=, not //=.
        my $recce_class = ref $recce;
        $recce_class ||= 'not defined';
        Marpa::PP::exception(
            "recognizer argument of tokens() has wrong class\n",
            'Class of argument is ',
            $recce_class,
            "\n",
            "Class of argument should be Marpa::PP::Recognizer\n"
        ) if $recce_class ne 'Marpa::PP::Recognizer';
    }

    Marpa::PP::exception('No tokens arg for Marpa::PP::Recognizer::tokens()')
        if not defined $tokens;

    my $mode = $recce->[Marpa::PP::Internal::Recognizer::MODE];
    my $interactive;

    if ( defined $token_ix_ref ) {
        my $ref_type = ref $token_ix_ref;
        if ( $ref_type ne 'SCALAR' ) {
            my $description = $ref_type ? "ref to $ref_type" : 'not a ref';
            Marpa::PP::exception(
                "Token index arg for Marpa::PP::Recognizer::tokens is $description, must be ref to SCALAR"
            );
        } ## end if ( $ref_type ne 'SCALAR' )
        Marpa::PP::exception(
            q{'Tokens index ref for Marpa::PP::Recognizer::tokens allowed only in 'stream' mode}
        ) if $mode ne 'stream';

        # A caller-supplied index ref switches rejection handling from
        # "throw" to "return early" (see the alternative() call below).
        $interactive = 1;
    } ## end if ( defined $token_ix_ref )

    my $grammar = $recce->[Marpa::PP::Internal::Recognizer::GRAMMAR];
    local $Marpa::PP::Internal::TRACE_FH = my $trace_fh =
        $recce->[Marpa::PP::Internal::Recognizer::TRACE_FILE_HANDLE];

    Marpa::PP::exception('Attempt to scan tokens after parsing is finished')
        if $recce->[Marpa::PP::Internal::Recognizer::FINISHED]
            and scalar @{$tokens};

    Marpa::PP::exception('Attempt to scan tokens when parsing is exhausted')
        if $recce->[Marpa::PP::Internal::Recognizer::EXHAUSTED]
            and scalar @{$tokens};

    my $symbol_hash = $grammar->[Marpa::PP::Internal::Grammar::SYMBOL_HASH];

    my $next_token_earleme = my $last_completed_earleme =
        $recce->[Marpa::PP::Internal::Recognizer::LAST_COMPLETED_EARLEME];

    # Without a caller-supplied index, start from the first descriptor.
    $token_ix_ref //= \( my $token_ix = 0 );

    # If the token list is empty, we will go straight to the
    # next token
    if ( not scalar @{$tokens} ) { $next_token_earleme++ }

    EARLEME: while ( ${$token_ix_ref} < scalar @{$tokens} ) {

        my $current_token_earleme = $last_completed_earleme;

        # At this point, typically, $current_token_earleme,
        # $next_token_earleme and $last_completed_earleme are
        # all equal.

        # It's not 100% clear whether it's best to leave
        # the token_ix_ref pointing at the start of the
        # earleme, or at the actual problem token.
        # Right now, we set it at the actual problem
        # token, which is probably what will turn out
        # to be easiest.

        # For as long as the $next_token_earleme does not advance ...
        TOKEN: while ( $current_token_earleme == $next_token_earleme ) {

            # ... or until we run out of tokens.
            # The end of the list is detected by index, not by the truth
            # of the descriptor: a false or undef entry must reach the
            # array-ref check below rather than silently end this loop
            # without consuming the entry, which would leave the outer
            # loop unable to make progress.
            last TOKEN if ${$token_ix_ref} >= scalar @{$tokens};

            my $token_args = $tokens->[ ${$token_ix_ref} ];
            Marpa::PP::exception(
                'Tokens must be array refs: token #',
                ${$token_ix_ref},
                ' is ' . ( $token_args // 'undef' ) . "\n",
            ) if ref $token_args ne 'ARRAY';
            ${$token_ix_ref}++;
            my ( $symbol_name, $value, $length, $offset ) = @{$token_args};

            Marpa::PP::exception(
                "Attempt to add token '$symbol_name' at location where processing is complete:\n",
                " Add attempted at $current_token_earleme\n",
                " Processing complete to $last_completed_earleme\n"
            ) if $current_token_earleme < $last_completed_earleme;

            # An unknown symbol is only reported on the trace handle here;
            # the token is still handed to alternative().
            my $symbol_id = $symbol_hash->{$symbol_name};
            if ( not defined $symbol_id ) {
                say {$trace_fh}
                    qq{Attempted to add non-existent symbol named "$symbol_name" at $last_completed_earleme\n}
                    or Marpa::PP::exception("Cannot print: $ERRNO");
            }

            my $result = $recce->alternative( $symbol_name, $value, $length );

            if ( not defined $result ) {
                if ( not $interactive ) {
                    Marpa::PP::exception(
                        qq{Terminal "$symbol_name" received when not expected}
                    );
                }

                # Current token didn't actually work, so back out
                # the increment
                ${$token_ix_ref}--;

                return $recce->status();
            } ## end if ( not defined $result )

            $offset //= 1;
            Marpa::PP::exception(
                'Token ' . $symbol_name . " has negative offset\n",
                " Token starts at $last_completed_earleme, and its length is $length\n",
                " Tokens are required to be in sequence by location\n",
            ) if $offset < 0;
            $next_token_earleme += $offset;

        } ## end while ( $current_token_earleme == $next_token_earleme )

        # We've ended the loop for the tokens at $current_token_earleme.
        # It is possible that $next_token_earleme did not advance,
        # and the loop ended when we ran out of tokens in the
        # argument list.
        # We arrange it so that the last descriptor in
        # a tokens call always advances the current earleme by at least one --
        # as if it had incremented $next_token_earleme
        $current_token_earleme++;
        $current_token_earleme = $next_token_earleme
            if $next_token_earleme > $current_token_earleme;

        $recce->earleme_complete();
        $last_completed_earleme++;

    } ## end while ( ${$token_ix_ref} < scalar @{$tokens} )

    # In 'stream' mode, complete earlemes up to where the next token
    # would start.
    if ( $mode eq 'stream' ) {
        while ( $last_completed_earleme < $next_token_earleme ) {
            $recce->earleme_complete();
            $last_completed_earleme++;
        }
    } ## end if ( $mode eq 'stream' )

    # In 'default' mode, complete every earleme up to the furthest one
    # recorded on the recognizer, then mark the recognizer finished.
    if ( $mode eq 'default' ) {
        while ( $last_completed_earleme
            < $recce->[Marpa::PP::Internal::Recognizer::FURTHEST_EARLEME] )
        {
            $recce->earleme_complete();
            $last_completed_earleme++;
        } ## end while ( $last_completed_earleme < $recce->[...])
        $recce->[Marpa::PP::Internal::Recognizer::FINISHED] = 1;
    } ## end if ( $mode eq 'default' )

    return $recce->status();

} ## end sub Marpa::PP::Recognizer::tokens
|
1368
|
|
|
|
|
|
|
|
|
1369
|
|
|
|
|
|
|
# Perform the completion step on an earley set |
|
1370
|
|
|
|
|
|
|
|
|
1371
|
|
|
|
|
|
|
# Signal the end of input for the recognizer.
#
# Calls earleme_complete() once for every earleme between the last
# completed earleme and the furthest earleme recorded on the recognizer,
# then sets the recognizer's FINISHED flag.
#
# Arguments:
#   $recce - the recognizer.
#
# Always returns 1.
sub Marpa::PP::Recognizer::end_input {
    my ($recce) = @_;

    # Both positions are read once, up front; the loop counts locally
    # and does not re-read them from the recognizer.
    my ( $completed_earleme, $target_earleme ) = @{$recce}[
        Marpa::PP::Internal::Recognizer::LAST_COMPLETED_EARLEME,
        Marpa::PP::Internal::Recognizer::FURTHEST_EARLEME
    ];

    until ( $completed_earleme >= $target_earleme ) {
        $recce->earleme_complete();
        $completed_earleme++;
    }

    $recce->[Marpa::PP::Internal::Recognizer::FINISHED] = 1;

    return 1;
} ## end sub Marpa::PP::Recognizer::end_input
|
1384
|
|
|
|
|
|
|
|
|
1385
|
|
|
|
|
|
|
sub Marpa::PP::Recognizer::earleme_complete { |
|
1386
|
22048
|
|
|
22048
|
0
|
36557
|
my ($recce) = @_; |
|
1387
|
|
|
|
|
|
|
|
|
1388
|
22048
|
|
|
|
|
37326
|
my $recce_c = $recce->[Marpa::PP::Internal::Recognizer::C]; |
|
1389
|
22048
|
|
|
|
|
49705
|
local $Marpa::PP::Internal::TRACE_FH = |
|
1390
|
|
|
|
|
|
|
$recce->[Marpa::PP::Internal::Recognizer::TRACE_FILE_HANDLE]; |
|
1391
|
22048
|
|
|
|
|
42980
|
my $grammar = $recce->[Marpa::PP::Internal::Recognizer::GRAMMAR]; |
|
1392
|
22048
|
|
|
|
|
32823
|
my $AHFA = $grammar->[Marpa::PP::Internal::Grammar::AHFA]; |
|
1393
|
22048
|
|
|
|
|
33690
|
my $symbol_hash = $grammar->[Marpa::PP::Internal::Grammar::SYMBOL_HASH]; |
|
1394
|
22048
|
|
|
|
|
31120
|
my $symbols = $grammar->[Marpa::PP::Internal::Grammar::SYMBOLS]; |
|
1395
|
22048
|
|
|
|
|
31230
|
my $earley_set_list = |
|
1396
|
|
|
|
|
|
|
$recce->[Marpa::PP::Internal::Recognizer::EARLEY_SETS]; |
|
1397
|
|
|
|
|
|
|
|
|
1398
|
22048
|
|
|
|
|
30255
|
my $terminal_names = |
|
1399
|
|
|
|
|
|
|
$grammar->[Marpa::PP::Internal::Grammar::TERMINAL_NAMES]; |
|
1400
|
22048
|
|
|
|
|
32252
|
my $too_many_earley_items = |
|
1401
|
|
|
|
|
|
|
$recce->[Marpa::PP::Internal::Recognizer::TOO_MANY_EARLEY_ITEMS]; |
|
1402
|
22048
|
|
|
|
|
30126
|
my $trace_earley_sets = |
|
1403
|
|
|
|
|
|
|
$recce->[Marpa::PP::Internal::Recognizer::TRACE_EARLEY_SETS]; |
|
1404
|
22048
|
|
100
|
|
|
90356
|
my $trace_terminals = |
|
1405
|
|
|
|
|
|
|
$recce->[Marpa::PP::Internal::Recognizer::TRACE_TERMINALS] // 0; |
|
1406
|
|
|
|
|
|
|
|
|
1407
|
22048
|
|
|
|
|
36380
|
my $earleme_to_complete = |
|
1408
|
|
|
|
|
|
|
++$recce->[Marpa::PP::Internal::Recognizer::LAST_COMPLETED_EARLEME]; |
|
1409
|
|
|
|
|
|
|
|
|
1410
|
22048
|
|
100
|
|
|
121266
|
my $earley_set = $earley_set_list->[$earleme_to_complete] //= []; |
|
1411
|
22048
|
|
100
|
|
|
118491
|
my $earley_items = |
|
1412
|
|
|
|
|
|
|
$earley_set->[Marpa::PP::Internal::Earley_Set::ITEMS] //= []; |
|
1413
|
22048
|
|
100
|
|
|
109579
|
my $earley_hash = $earley_set->[Marpa::PP::Internal::Earley_Set::HASH] //= |
|
1414
|
|
|
|
|
|
|
{}; |
|
1415
|
22048
|
|
50
|
|
|
93359
|
my $postdot_here = |
|
1416
|
|
|
|
|
|
|
$earley_set->[Marpa::PP::Internal::Earley_Set::POSTDOT] //= {}; |
|
1417
|
|
|
|
|
|
|
|
|
1418
|
|
|
|
|
|
|
# Important: more earley sets can be added in the loop |
|
1419
|
22048
|
|
|
|
|
33399
|
my $earley_set_ix = -1; |
|
1420
|
22048
|
|
|
|
|
48536
|
EARLEY_ITEM: while (1) { |
|
1421
|
|
|
|
|
|
|
|
|
1422
|
39315
|
|
|
|
|
111930
|
my $earley_item = $earley_items->[ ++$earley_set_ix ]; |
|
1423
|
39315
|
100
|
|
|
|
111252
|
last EARLEY_ITEM if not defined $earley_item; |
|
1424
|
|
|
|
|
|
|
|
|
1425
|
17267
|
|
|
|
|
23249
|
my ( $state, $parent ) = @{$earley_item}[ |
|
|
17267
|
|
|
|
|
39979
|
|
|
1426
|
|
|
|
|
|
|
Marpa::PP::Internal::Earley_Item::STATE, |
|
1427
|
|
|
|
|
|
|
Marpa::PP::Internal::Earley_Item::ORIGIN |
|
1428
|
|
|
|
|
|
|
]; |
|
1429
|
17267
|
|
|
|
|
24977
|
my $state_id = $state->[Marpa::PP::Internal::AHFA::ID]; |
|
1430
|
|
|
|
|
|
|
|
|
1431
|
17267
|
100
|
|
|
|
41230
|
next EARLEY_ITEM if $earleme_to_complete == $parent; |
|
1432
|
|
|
|
|
|
|
|
|
1433
|
16095
|
|
|
|
|
39649
|
LHS_SYMBOL: |
|
1434
|
16095
|
|
|
|
|
18202
|
for my $lhs_symbol ( |
|
1435
|
|
|
|
|
|
|
@{ $state->[Marpa::PP::Internal::AHFA::COMPLETE_LHS] } ) |
|
1436
|
|
|
|
|
|
|
{ |
|
1437
|
14971
|
|
|
|
|
40349
|
my $postdot_data = |
|
1438
|
|
|
|
|
|
|
$earley_set_list->[$parent] |
|
1439
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Set::POSTDOT]->{$lhs_symbol}; |
|
1440
|
14971
|
100
|
|
|
|
32674
|
next LHS_SYMBOL if not defined $postdot_data; |
|
1441
|
14062
|
|
|
|
|
31916
|
PARENT_ITEM: |
|
1442
|
14062
|
|
|
|
|
15077
|
for my $postdot_item ( @{$postdot_data} ) { |
|
1443
|
18060
|
|
|
|
|
25229
|
my $parent_origin; |
|
1444
|
|
|
|
|
|
|
my @transition_states; |
|
1445
|
|
|
|
|
|
|
|
|
1446
|
18060
|
|
|
|
|
38015
|
my $postdot_item_is_leo = ref $postdot_item eq $LEO_CLASS; |
|
1447
|
18060
|
100
|
|
|
|
32822
|
if ($postdot_item_is_leo) { |
|
1448
|
1828
|
|
|
|
|
3709
|
$parent_origin = $postdot_item |
|
1449
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Leo_Item::ORIGIN]; |
|
1450
|
1828
|
|
|
|
|
4587
|
@transition_states = $postdot_item |
|
1451
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Leo_Item::TOP_TO_STATE]; |
|
1452
|
|
|
|
|
|
|
} ## end if ($postdot_item_is_leo) |
|
1453
|
|
|
|
|
|
|
else { |
|
1454
|
16232
|
|
|
|
|
29834
|
my $parent_state = $postdot_item |
|
1455
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::STATE]; |
|
1456
|
25398
|
|
|
|
|
85431
|
@transition_states = |
|
1457
|
16232
|
|
|
|
|
55437
|
grep {ref} |
|
1458
|
16232
|
|
|
|
|
23428
|
@{ $parent_state |
|
1459
|
|
|
|
|
|
|
->[Marpa::PP::Internal::AHFA::TRANSITION] |
|
1460
|
|
|
|
|
|
|
->{$lhs_symbol} }; |
|
1461
|
16232
|
|
|
|
|
30966
|
$parent_origin = $postdot_item |
|
1462
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::ORIGIN]; |
|
1463
|
|
|
|
|
|
|
} ## end else [ if ($postdot_item_is_leo) ] |
|
1464
|
|
|
|
|
|
|
|
|
1465
|
|
|
|
|
|
|
TRANSITION_STATE: |
|
1466
|
18060
|
|
|
|
|
46056
|
for my $transition_state (@transition_states) { |
|
1467
|
20010
|
|
|
|
|
33077
|
my $reset = $transition_state |
|
1468
|
|
|
|
|
|
|
->[Marpa::PP::Internal::AHFA::RESET_ORIGIN]; |
|
1469
|
20010
|
100
|
|
|
|
47321
|
my $origin = |
|
1470
|
|
|
|
|
|
|
$reset |
|
1471
|
|
|
|
|
|
|
? $earleme_to_complete |
|
1472
|
|
|
|
|
|
|
: $parent_origin; |
|
1473
|
20010
|
|
|
|
|
57039
|
my $transition_state_id = |
|
1474
|
|
|
|
|
|
|
$transition_state->[Marpa::PP::Internal::AHFA::ID]; |
|
1475
|
20010
|
|
|
|
|
61648
|
my $name = sprintf |
|
1476
|
|
|
|
|
|
|
'S%d@%d-%d', |
|
1477
|
|
|
|
|
|
|
$transition_state_id, $origin, $earleme_to_complete; |
|
1478
|
20010
|
|
|
|
|
38167
|
my $hash_key = join q{:}, $transition_state_id, $origin; |
|
1479
|
20010
|
|
|
|
|
33123
|
my $target_item = $earley_hash->{$hash_key}; |
|
1480
|
20010
|
100
|
|
|
|
51711
|
if ( not defined $target_item ) { |
|
1481
|
14231
|
|
|
|
|
40622
|
$target_item = []; |
|
1482
|
14231
|
|
|
|
|
34399
|
$target_item->[Marpa::PP::Internal::Earley_Item::ID] = |
|
1483
|
|
|
|
|
|
|
$recce->[ |
|
1484
|
|
|
|
|
|
|
Marpa::PP::Internal::Recognizer::NEXT_EARLEY_ITEM_ID |
|
1485
|
|
|
|
|
|
|
]++; |
|
1486
|
14231
|
|
|
|
|
20784
|
$target_item |
|
1487
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::STATE] = |
|
1488
|
|
|
|
|
|
|
$transition_state; |
|
1489
|
14231
|
|
|
|
|
35337
|
$target_item |
|
1490
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::ORIGIN] = |
|
1491
|
|
|
|
|
|
|
$origin; |
|
1492
|
14231
|
|
|
|
|
40114
|
$target_item |
|
1493
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::LEO_LINKS] = |
|
1494
|
|
|
|
|
|
|
[]; |
|
1495
|
14231
|
|
|
|
|
34730
|
$target_item |
|
1496
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::LINKS] = []; |
|
1497
|
14231
|
|
|
|
|
26407
|
$target_item->[Marpa::PP::Internal::Earley_Item::SET] |
|
1498
|
|
|
|
|
|
|
= $earleme_to_complete; |
|
1499
|
14231
|
|
|
|
|
66039
|
$earley_hash->{$hash_key} = $target_item; |
|
1500
|
14231
|
|
|
|
|
16800
|
push @{$earley_items}, $target_item; |
|
|
14231
|
|
|
|
|
40998
|
|
|
1501
|
|
|
|
|
|
|
} # unless defined $target_item |
|
1502
|
20010
|
100
|
|
|
|
68219
|
next TRANSITION_STATE if $reset; |
|
1503
|
18060
|
100
|
|
|
|
42537
|
if ($postdot_item_is_leo) { |
|
1504
|
1828
|
|
|
|
|
10434
|
push @{ |
|
1505
|
1828
|
|
|
|
|
2255
|
$target_item->[ |
|
1506
|
|
|
|
|
|
|
Marpa::PP::Internal::Earley_Item::LEO_LINKS |
|
1507
|
|
|
|
|
|
|
] |
|
1508
|
|
|
|
|
|
|
}, |
|
1509
|
|
|
|
|
|
|
[ $postdot_item, $earley_item, $lhs_symbol ]; |
|
1510
|
|
|
|
|
|
|
|
|
1511
|
|
|
|
|
|
|
# If we do the Leo item, do *ONLY* the Leo item |
|
1512
|
1828
|
|
|
|
|
15463
|
last PARENT_ITEM; |
|
1513
|
|
|
|
|
|
|
} ## end if ($postdot_item_is_leo) |
|
1514
|
|
|
|
|
|
|
else { |
|
1515
|
16232
|
|
|
|
|
19523
|
push @{ $target_item |
|
|
16232
|
|
|
|
|
145439
|
|
|
1516
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::LINKS] }, |
|
1517
|
|
|
|
|
|
|
[ $postdot_item, $earley_item, $lhs_symbol ]; |
|
1518
|
|
|
|
|
|
|
} |
|
1519
|
|
|
|
|
|
|
} # TRANSITION_STATE |
|
1520
|
|
|
|
|
|
|
|
|
1521
|
|
|
|
|
|
|
} # PARENT_ITEM |
|
1522
|
|
|
|
|
|
|
} # LHS_SYMBOL |
|
1523
|
|
|
|
|
|
|
|
|
1524
|
|
|
|
|
|
|
} # EARLEY_ITEM |
|
1525
|
|
|
|
|
|
|
|
|
1526
|
22048
|
50
|
33
|
|
|
76289
|
if ( $too_many_earley_items >= 0 |
|
|
22048
|
|
|
|
|
110119
|
|
|
1527
|
|
|
|
|
|
|
and ( my $item_count = scalar @{$earley_items} ) |
|
1528
|
|
|
|
|
|
|
>= $too_many_earley_items ) |
|
1529
|
|
|
|
|
|
|
{ |
|
1530
|
0
|
0
|
|
|
|
0
|
if ( $recce->[Marpa::PP::Internal::Recognizer::WARNINGS] ) { |
|
1531
|
0
|
0
|
|
|
|
0
|
say {$Marpa::PP::Internal::TRACE_FH} |
|
|
0
|
|
|
|
|
0
|
|
|
1532
|
|
|
|
|
|
|
"Very large earley set: $item_count items at location $earleme_to_complete" |
|
1533
|
|
|
|
|
|
|
or Marpa::PP::exception("Cannot print: $ERRNO"); |
|
1534
|
|
|
|
|
|
|
} |
|
1535
|
|
|
|
|
|
|
} ## end if ( $too_many_earley_items >= 0 and ( my $item_count...)) |
|
1536
|
|
|
|
|
|
|
|
|
1537
|
|
|
|
|
|
|
# Each possible cause |
|
1538
|
|
|
|
|
|
|
# link is only visited once. |
|
1539
|
|
|
|
|
|
|
# It may be paired with several different predecessors. |
|
1540
|
|
|
|
|
|
|
# The cause may complete several different LHS symbols |
|
1541
|
|
|
|
|
|
|
# and Marpa::PP will seek predecessors for each at |
|
1542
|
|
|
|
|
|
|
# the parent location. |
|
1543
|
|
|
|
|
|
|
# Different completed LHS symbols might be postdot |
|
1544
|
|
|
|
|
|
|
# symbols for the same predecessor Earley item. |
|
1545
|
|
|
|
|
|
|
# For this reason, |
|
1546
|
|
|
|
|
|
|
# predecessor-cause pairs might not be unique |
|
1547
|
|
|
|
|
|
|
# within an Earley item. |
|
1548
|
|
|
|
|
|
|
# |
|
1549
|
|
|
|
|
|
|
# This is not an issue for unambiguous parsing. |
|
1550
|
|
|
|
|
|
|
# It *IS* an issue for iterating ambiguous parses. |
|
1551
|
|
|
|
|
|
|
|
|
1552
|
22048
|
50
|
|
|
|
51095
|
if ($trace_earley_sets) { |
|
1553
|
0
|
0
|
|
|
|
0
|
print {$Marpa::PP::Internal::TRACE_FH} |
|
|
0
|
|
|
|
|
0
|
|
|
1554
|
|
|
|
|
|
|
"=== Earley set $earleme_to_complete\n" |
|
1555
|
|
|
|
|
|
|
or Marpa::PP::exception("Cannot print: $ERRNO"); |
|
1556
|
0
|
0
|
|
|
|
0
|
print {$Marpa::PP::Internal::TRACE_FH} |
|
|
0
|
|
|
|
|
0
|
|
|
1557
|
|
|
|
|
|
|
Marpa::PP::show_earley_set($earley_set) |
|
1558
|
|
|
|
|
|
|
or Marpa::PP::exception("Cannot print: $ERRNO"); |
|
1559
|
|
|
|
|
|
|
} ## end if ($trace_earley_sets) |
|
1560
|
|
|
|
|
|
|
|
|
1561
|
22048
|
|
|
|
|
33837
|
for my $earley_item ( @{$earley_items} ) { |
|
|
22048
|
|
|
|
|
51848
|
|
|
1562
|
17267
|
|
|
|
|
40452
|
my $state = $earley_item->[Marpa::PP::Internal::Earley_Item::STATE]; |
|
1563
|
17267
|
|
|
|
|
34102
|
my $parent = $earley_item->[Marpa::PP::Internal::Earley_Item::ORIGIN]; |
|
1564
|
17267
|
|
|
|
|
17551
|
for my $postdot_symbol_name ( |
|
|
17267
|
|
|
|
|
68170
|
|
|
1565
|
|
|
|
|
|
|
keys %{ $state->[Marpa::PP::Internal::AHFA::TRANSITION] } ) |
|
1566
|
|
|
|
|
|
|
{ |
|
1567
|
39810
|
|
|
|
|
67315
|
push @{ $postdot_here->{$postdot_symbol_name} }, $earley_item; |
|
|
39810
|
|
|
|
|
162505
|
|
|
1568
|
|
|
|
|
|
|
} |
|
1569
|
|
|
|
|
|
|
} ## end for my $earley_item ( @{$earley_items} ) |
|
1570
|
|
|
|
|
|
|
|
|
1571
|
|
|
|
|
|
|
# Create the unpopulated Leo items, and put them into a worklist |
|
1572
|
22048
|
|
|
|
|
42888
|
my @leo_worklist = (); |
|
1573
|
22048
|
100
|
|
|
|
62727
|
if ( $recce->[Marpa::PP::Internal::Recognizer::USE_LEO] ) { |
|
1574
|
21978
|
|
|
|
|
53949
|
SYMBOL: for my $postdot_symbol_name ( keys %{$postdot_here} ) { |
|
|
21978
|
|
|
|
|
101338
|
|
|
1575
|
37009
|
|
|
|
|
58235
|
my $postdot_data = $postdot_here->{$postdot_symbol_name}; |
|
1576
|
37009
|
100
|
|
|
|
46727
|
next SYMBOL if scalar @{$postdot_data} != 1; |
|
|
37009
|
|
|
|
|
110712
|
|
|
1577
|
35358
|
|
|
|
|
65637
|
my $earley_item = $postdot_data->[0]; |
|
1578
|
35358
|
|
|
|
|
152705
|
my ( $leo_lhs, $base_to_state ) = |
|
1579
|
35358
|
|
|
|
|
48673
|
@{ $earley_item->[Marpa::PP::Internal::Earley_Item::STATE] |
|
1580
|
|
|
|
|
|
|
->[Marpa::PP::Internal::AHFA::TRANSITION] |
|
1581
|
|
|
|
|
|
|
->{$postdot_symbol_name} }; |
|
1582
|
|
|
|
|
|
|
|
|
1583
|
|
|
|
|
|
|
# Only one transition in the Earley set on this symbol, |
|
1584
|
|
|
|
|
|
|
# but it is not to a Leo completion. |
|
1585
|
35358
|
100
|
|
|
|
128784
|
next SYMBOL if ref $leo_lhs; |
|
1586
|
|
|
|
|
|
|
|
|
1587
|
4934
|
|
|
|
|
19812
|
my $leo_item = bless [], $LEO_CLASS; |
|
1588
|
|
|
|
|
|
|
|
|
1589
|
|
|
|
|
|
|
# $leo_item->[Marpa::PP::Internal::Leo_Item::BASE_TO_STATE] = |
|
1590
|
|
|
|
|
|
|
# $base_to_state; |
|
1591
|
4934
|
|
|
|
|
10330
|
$leo_item->[Marpa::PP::Internal::Leo_Item::SET] = |
|
1592
|
|
|
|
|
|
|
$earleme_to_complete; |
|
1593
|
4934
|
|
|
|
|
8094
|
$leo_item->[Marpa::PP::Internal::Leo_Item::LEO_POSTDOT_SYMBOL] = |
|
1594
|
|
|
|
|
|
|
$postdot_symbol_name; |
|
1595
|
4934
|
|
|
|
|
6486
|
$leo_item->[Marpa::PP::Internal::Leo_Item::BASE] = $earley_item; |
|
1596
|
|
|
|
|
|
|
|
|
1597
|
4934
|
|
|
|
|
14014
|
unshift @{ $postdot_here->{$postdot_symbol_name} }, $leo_item; |
|
|
4934
|
|
|
|
|
11626
|
|
|
1598
|
4934
|
|
|
|
|
12723
|
push @leo_worklist, $postdot_symbol_name; |
|
1599
|
|
|
|
|
|
|
|
|
1600
|
|
|
|
|
|
|
} ## end for my $postdot_symbol_name ( keys %{$postdot_here} ) |
|
1601
|
|
|
|
|
|
|
} ## end if ( $recce->[Marpa::PP::Internal::Recognizer::USE_LEO...]) |
|
1602
|
|
|
|
|
|
|
|
|
1603
|
22048
|
|
|
|
|
70818
|
POSTDOT_SYMBOL: for my $postdot_symbol_name (@leo_worklist) { |
|
1604
|
|
|
|
|
|
|
|
|
1605
|
4934
|
|
|
|
|
9682
|
my $leo_item = $postdot_here->{$postdot_symbol_name}->[0]; |
|
1606
|
|
|
|
|
|
|
next POSTDOT_SYMBOL |
|
1607
|
|
|
|
|
|
|
if |
|
1608
|
4934
|
100
|
|
|
|
12538
|
defined $leo_item->[Marpa::PP::Internal::Leo_Item::TOP_TO_STATE]; |
|
1609
|
|
|
|
|
|
|
|
|
1610
|
|
|
|
|
|
|
# Find the predecessor LIM |
|
1611
|
3887
|
|
|
|
|
4613
|
my $base_earley_item = |
|
1612
|
|
|
|
|
|
|
$leo_item->[Marpa::PP::Internal::Leo_Item::BASE]; |
|
1613
|
3887
|
|
|
|
|
6389
|
my $base_origin = |
|
1614
|
|
|
|
|
|
|
$base_earley_item->[Marpa::PP::Internal::Earley_Item::ORIGIN]; |
|
1615
|
3887
|
|
|
|
|
10735
|
my ( $leo_transition_symbol, $top_to_state ) = |
|
1616
|
3887
|
|
|
|
|
5797
|
@{ $base_earley_item->[Marpa::PP::Internal::Earley_Item::STATE] |
|
1617
|
|
|
|
|
|
|
->[Marpa::PP::Internal::AHFA::TRANSITION] |
|
1618
|
|
|
|
|
|
|
->{$postdot_symbol_name} }; |
|
1619
|
3887
|
|
|
|
|
8024
|
my $predecessor_postdot = |
|
1620
|
|
|
|
|
|
|
$earley_set_list->[$base_origin] |
|
1621
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Set::POSTDOT] |
|
1622
|
|
|
|
|
|
|
->{$leo_transition_symbol}; |
|
1623
|
3887
|
|
|
|
|
17640
|
my $first_postdot_item = $predecessor_postdot->[0]; |
|
1624
|
3887
|
100
|
|
|
|
10965
|
my $predecessor_leo_item = |
|
1625
|
|
|
|
|
|
|
ref $first_postdot_item eq $LEO_CLASS |
|
1626
|
|
|
|
|
|
|
? $first_postdot_item |
|
1627
|
|
|
|
|
|
|
: undef; |
|
1628
|
|
|
|
|
|
|
|
|
1629
|
|
|
|
|
|
|
# If there is a predecessor Leo item and it is populated, populate from the predecessor |
|
1630
|
|
|
|
|
|
|
# Leo item |
|
1631
|
3887
|
100
|
|
|
|
8065
|
my $predecessor_top_to_state = |
|
1632
|
|
|
|
|
|
|
defined $predecessor_leo_item |
|
1633
|
|
|
|
|
|
|
? $predecessor_leo_item |
|
1634
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Leo_Item::TOP_TO_STATE] |
|
1635
|
|
|
|
|
|
|
: undef; |
|
1636
|
3887
|
100
|
|
|
|
27323
|
if ( defined $predecessor_top_to_state ) { |
|
1637
|
1514
|
|
|
|
|
2320
|
$leo_item->[Marpa::PP::Internal::Leo_Item::PREDECESSOR] = |
|
1638
|
|
|
|
|
|
|
$predecessor_leo_item; |
|
1639
|
1514
|
|
|
|
|
2661
|
$leo_item->[Marpa::PP::Internal::Leo_Item::TOP_TO_STATE] = |
|
1640
|
|
|
|
|
|
|
$predecessor_top_to_state; |
|
1641
|
1514
|
|
|
|
|
3399
|
$leo_item->[Marpa::PP::Internal::Leo_Item::ORIGIN] = |
|
1642
|
|
|
|
|
|
|
$predecessor_leo_item |
|
1643
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Leo_Item::ORIGIN]; |
|
1644
|
1514
|
|
|
|
|
12354
|
next POSTDOT_SYMBOL; |
|
1645
|
|
|
|
|
|
|
} ## end if ( defined $predecessor_top_to_state ) |
|
1646
|
|
|
|
|
|
|
|
|
1647
|
|
|
|
|
|
|
# If there is no predecessor Leo item, populate from the base Earley item |
|
1648
|
2373
|
100
|
|
|
|
5543
|
if ( not defined $predecessor_leo_item ) { |
|
1649
|
1619
|
|
|
|
|
3433
|
$leo_item->[Marpa::PP::Internal::Leo_Item::ORIGIN] = $base_origin; |
|
1650
|
1619
|
|
|
|
|
3286
|
$leo_item->[Marpa::PP::Internal::Leo_Item::TOP_TO_STATE] = |
|
1651
|
|
|
|
|
|
|
$top_to_state; |
|
1652
|
1619
|
|
|
|
|
4060
|
next POSTDOT_SYMBOL; |
|
1653
|
|
|
|
|
|
|
} ## end if ( not defined $predecessor_leo_item ) |
|
1654
|
|
|
|
|
|
|
|
|
1655
|
|
|
|
|
|
|
# If there is a predecessor, but it is not populated, we need to build a |
|
1656
|
|
|
|
|
|
|
# predecessor chain of Leo items |
|
1657
|
754
|
|
|
|
|
13887
|
my @leo_chain = ($postdot_symbol_name); |
|
1658
|
754
|
|
|
|
|
906
|
BUILD_LEO_CHAIN: while (1) { |
|
1659
|
1047
|
|
|
|
|
1330
|
my $chain_leo_item = $predecessor_leo_item; |
|
1660
|
1047
|
|
|
|
|
1683
|
my $chain_leo_transition_symbol = $chain_leo_item |
|
1661
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Leo_Item::LEO_POSTDOT_SYMBOL]; |
|
1662
|
|
|
|
|
|
|
|
|
1663
|
|
|
|
|
|
|
# If this Leo item is already on the chain, break here. |
|
1664
|
|
|
|
|
|
|
# The predecessor Leo item has not yet been updated |
|
1665
|
|
|
|
|
|
|
# (it and the current Leo item are the same) |
|
1666
|
|
|
|
|
|
|
# so the predecessor Leo item |
|
1667
|
|
|
|
|
|
|
# is still correct for the Leo item at the top of the |
|
1668
|
|
|
|
|
|
|
# Leo item chain. |
|
1669
|
|
|
|
|
|
|
last BUILD_LEO_CHAIN |
|
1670
|
1047
|
50
|
|
|
|
4310
|
if $chain_leo_transition_symbol ~~ @leo_chain; |
|
1671
|
|
|
|
|
|
|
|
|
1672
|
|
|
|
|
|
|
# Find the new predecessor Leo item |
|
1673
|
1047
|
|
|
|
|
1498
|
my $chain_base_earley_item = |
|
1674
|
|
|
|
|
|
|
$chain_leo_item->[Marpa::PP::Internal::Leo_Item::BASE]; |
|
1675
|
1047
|
|
|
|
|
14210
|
my $chain_base_origin = $chain_base_earley_item |
|
1676
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::ORIGIN]; |
|
1677
|
1047
|
|
|
|
|
3491
|
my ( $chain_predecessor_leo_transition_symbol, |
|
1678
|
|
|
|
|
|
|
$chain_top_to_state ) |
|
1679
|
1047
|
|
|
|
|
1239
|
= @{ $chain_base_earley_item |
|
1680
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::STATE] |
|
1681
|
|
|
|
|
|
|
->[Marpa::PP::Internal::AHFA::TRANSITION] |
|
1682
|
|
|
|
|
|
|
->{$chain_leo_transition_symbol} }; |
|
1683
|
1047
|
|
|
|
|
2248
|
my $chain_predecessor_postdot = |
|
1684
|
|
|
|
|
|
|
$earley_set_list->[$chain_base_origin] |
|
1685
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Set::POSTDOT] |
|
1686
|
|
|
|
|
|
|
->{$chain_predecessor_leo_transition_symbol}; |
|
1687
|
1047
|
|
|
|
|
1416
|
my $chain_first_postdot_item = $chain_predecessor_postdot->[0]; |
|
1688
|
1047
|
100
|
|
|
|
2762
|
$predecessor_leo_item = |
|
1689
|
|
|
|
|
|
|
ref $chain_first_postdot_item eq $LEO_CLASS |
|
1690
|
|
|
|
|
|
|
? $chain_first_postdot_item |
|
1691
|
|
|
|
|
|
|
: undef; |
|
1692
|
|
|
|
|
|
|
|
|
1693
|
1047
|
|
|
|
|
1681
|
push @leo_chain, $chain_leo_transition_symbol; |
|
1694
|
|
|
|
|
|
|
|
|
1695
|
|
|
|
|
|
|
# No predecessor, so I am forced to break the Leo chain here. |
|
1696
|
1047
|
100
|
|
|
|
3535
|
last BUILD_LEO_CHAIN if not defined $predecessor_leo_item; |
|
1697
|
|
|
|
|
|
|
|
|
1698
|
|
|
|
|
|
|
# A populated predecessor, so I can fully populate the Leo chain. |
|
1699
|
|
|
|
|
|
|
# Break the Leo chain here. |
|
1700
|
|
|
|
|
|
|
last BUILD_LEO_CHAIN |
|
1701
|
458
|
100
|
|
|
|
1722
|
if defined $predecessor_leo_item |
|
1702
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Leo_Item::TOP_TO_STATE]; |
|
1703
|
|
|
|
|
|
|
} ## end while (1) |
|
1704
|
|
|
|
|
|
|
|
|
1705
|
754
|
|
|
|
|
2270
|
while ( my $chain_leo_transition_symbol = pop @leo_chain ) { |
|
1706
|
1801
|
|
|
|
|
3200
|
my $chain_leo_item = |
|
1707
|
|
|
|
|
|
|
$postdot_here->{$chain_leo_transition_symbol}->[0]; |
|
1708
|
|
|
|
|
|
|
|
|
1709
|
|
|
|
|
|
|
# If there is a predecessor Leo item and it is populated, populate from the predecessor |
|
1710
|
|
|
|
|
|
|
# Leo item |
|
1711
|
1801
|
100
|
|
|
|
3559
|
my $chain_predecessor_top_to_state = |
|
1712
|
|
|
|
|
|
|
$predecessor_leo_item |
|
1713
|
|
|
|
|
|
|
? $predecessor_leo_item |
|
1714
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Leo_Item::TOP_TO_STATE] |
|
1715
|
|
|
|
|
|
|
: undef; |
|
1716
|
1801
|
100
|
|
|
|
3739
|
if ( defined $chain_predecessor_top_to_state ) { |
|
1717
|
1212
|
|
|
|
|
1950
|
$chain_leo_item->[Marpa::PP::Internal::Leo_Item::PREDECESSOR] |
|
1718
|
|
|
|
|
|
|
= $predecessor_leo_item; |
|
1719
|
1212
|
|
|
|
|
2485
|
$chain_leo_item->[Marpa::PP::Internal::Leo_Item::TOP_TO_STATE] |
|
1720
|
|
|
|
|
|
|
= $chain_predecessor_top_to_state; |
|
1721
|
1212
|
|
|
|
|
2633
|
$chain_leo_item->[Marpa::PP::Internal::Leo_Item::ORIGIN] = |
|
1722
|
|
|
|
|
|
|
$predecessor_leo_item |
|
1723
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Leo_Item::ORIGIN]; |
|
1724
|
|
|
|
|
|
|
} ## end if ( defined $chain_predecessor_top_to_state ) |
|
1725
|
|
|
|
|
|
|
else { |
|
1726
|
589
|
|
|
|
|
1252
|
my $chain_base_earley_item = |
|
1727
|
|
|
|
|
|
|
$chain_leo_item->[Marpa::PP::Internal::Leo_Item::BASE]; |
|
1728
|
589
|
|
|
|
|
1090
|
my $chain_base_origin = $chain_base_earley_item |
|
1729
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::ORIGIN]; |
|
1730
|
589
|
|
|
|
|
1477
|
my ( undef, $chain_top_to_state ) = |
|
1731
|
589
|
|
|
|
|
9406
|
@{ $chain_base_earley_item |
|
1732
|
|
|
|
|
|
|
->[Marpa::PP::Internal::Earley_Item::STATE] |
|
1733
|
|
|
|
|
|
|
->[Marpa::PP::Internal::AHFA::TRANSITION] |
|
1734
|
|
|
|
|
|
|
->{$chain_leo_transition_symbol} }; |
|
1735
|
589
|
|
|
|
|
1653
|
$chain_leo_item->[Marpa::PP::Internal::Leo_Item::ORIGIN] = |
|
1736
|
|
|
|
|
|
|
$chain_base_origin; |
|
1737
|
589
|
|
|
|
|
1522
|
$chain_leo_item->[Marpa::PP::Internal::Leo_Item::TOP_TO_STATE] |
|
1738
|
|
|
|
|
|
|
= $chain_top_to_state; |
|
1739
|
|
|
|
|
|
|
} ## end else [ if ( defined $chain_predecessor_top_to_state ) ] |
|
1740
|
1801
|
|
|
|
|
16292
|
$predecessor_leo_item = $chain_leo_item; |
|
1741
|
|
|
|
|
|
|
} ## end while ( my $chain_leo_transition_symbol = pop @leo_chain) |
|
1742
|
|
|
|
|
|
|
} ## end for my $postdot_symbol_name (@leo_worklist) |
|
1743
|
|
|
|
|
|
|
|
|
1744
|
37209
|
|
|
|
|
106936
|
my @terminals_expected = |
|
1745
|
22048
|
|
|
|
|
43075
|
grep { $terminal_names->{$_} } keys %{$postdot_here}; |
|
|
22048
|
|
|
|
|
59926
|
|
|
1746
|
22048
|
|
|
|
|
51880
|
$recce->[Marpa::PP::Internal::Recognizer::EXPECTED_TERMINALS] = |
|
1747
|
|
|
|
|
|
|
\@terminals_expected; |
|
1748
|
|
|
|
|
|
|
|
|
1749
|
22048
|
|
100
|
|
|
116221
|
$recce->[Marpa::PP::Internal::Recognizer::EXHAUSTED] = |
|
1750
|
|
|
|
|
|
|
( scalar @terminals_expected <= 0 ) |
|
1751
|
|
|
|
|
|
|
&& $earleme_to_complete |
|
1752
|
|
|
|
|
|
|
>= $recce->[Marpa::PP::Internal::Recognizer::FURTHEST_EARLEME]; |
|
1753
|
|
|
|
|
|
|
|
|
1754
|
22048
|
100
|
|
|
|
57546
|
if ( $trace_terminals > 1 ) { |
|
1755
|
3
|
|
|
|
|
7
|
for my $terminal ( sort @terminals_expected ) { |
|
1756
|
4
|
50
|
|
|
|
5
|
say {$Marpa::PP::Internal::TRACE_FH} |
|
|
4
|
|
|
|
|
26
|
|
|
1757
|
|
|
|
|
|
|
qq{Expecting "$terminal" at $earleme_to_complete} |
|
1758
|
|
|
|
|
|
|
or Marpa::PP::exception("Cannot print: $ERRNO"); |
|
1759
|
|
|
|
|
|
|
} |
|
1760
|
|
|
|
|
|
|
} ## end if ( $trace_terminals > 1 ) |
|
1761
|
|
|
|
|
|
|
|
|
1762
|
22048
|
100
|
|
|
|
32069
|
if ( scalar @{$earley_items} > 0 ) { |
|
|
22048
|
|
|
|
|
83161
|
|
|
1763
|
1906
|
|
|
|
|
3504
|
my $ordinal = |
|
1764
|
|
|
|
|
|
|
$recce->[Marpa::PP::Internal::Recognizer::NEXT_ORDINAL]++; |
|
1765
|
1906
|
|
|
|
|
3417
|
$earley_set->[Marpa::PP::Internal::Earley_Set::ORDINAL] = $ordinal; |
|
1766
|
1906
|
|
|
|
|
4311
|
$recce->[Marpa::PP::Internal::Recognizer::EARLEY_SETS_BY_ORDINAL] |
|
1767
|
|
|
|
|
|
|
->[$ordinal] = $earley_set; |
|
1768
|
|
|
|
|
|
|
} ## end if ( scalar @{$earley_items} > 0 ) |
|
1769
|
|
|
|
|
|
|
|
|
1770
|
22048
|
|
|
|
|
87362
|
return scalar @terminals_expected; |
|
1771
|
|
|
|
|
|
|
|
|
1772
|
|
|
|
|
|
|
} ## end sub Marpa::PP::Recognizer::earleme_complete |
|
1773
|
|
|
|
|
|
|
|
|
1774
|
|
|
|
|
|
|
1; |