line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
# /=====================================================================\ # |
2
|
|
|
|
|
|
|
# | LaTeXML | # |
3
|
|
|
|
|
|
|
# | Core Module for TeX conversion | # |
4
|
|
|
|
|
|
|
# |=====================================================================| # |
5
|
|
|
|
|
|
|
# | Part of LaTeXML: | # |
6
|
|
|
|
|
|
|
# | Public domain software, produced as part of work done by the | # |
7
|
|
|
|
|
|
|
# | United States Government & not subject to copyright in the US. | # |
8
|
|
|
|
|
|
|
# |---------------------------------------------------------------------| # |
9
|
|
|
|
|
|
|
# | Bruce Miller #_# | # |
10
|
|
|
|
|
|
|
# | http://dlmf.nist.gov/LaTeXML/ (o o) | # |
11
|
|
|
|
|
|
|
# \=========================================================ooo==U==ooo=/ # |
12
|
|
|
|
|
|
|
|
13
|
|
|
|
|
|
|
package LaTeXML::Core; |
14
|
21
|
|
|
21
|
|
72
|
use strict; |
|
21
|
|
|
|
|
28
|
|
|
21
|
|
|
|
|
510
|
|
15
|
21
|
|
|
21
|
|
67
|
use warnings; |
|
21
|
|
|
|
|
23
|
|
|
21
|
|
|
|
|
497
|
|
16
|
21
|
|
|
21
|
|
6467
|
use LaTeXML::Global; |
|
21
|
|
|
|
|
33
|
|
|
21
|
|
|
|
|
1865
|
|
17
|
|
|
|
|
|
|
#use LaTeXML::Common::Object; |
18
|
21
|
|
|
21
|
|
8231
|
use LaTeXML::Common::Error; |
|
0
|
|
|
|
|
|
|
|
0
|
|
|
|
|
|
|
19
|
|
|
|
|
|
|
use LaTeXML::Core::State; |
20
|
|
|
|
|
|
|
use LaTeXML::Core::Token; |
21
|
|
|
|
|
|
|
use LaTeXML::Core::Tokens; |
22
|
|
|
|
|
|
|
use LaTeXML::Core::Stomach; |
23
|
|
|
|
|
|
|
use LaTeXML::Core::Document; |
24
|
|
|
|
|
|
|
use LaTeXML::Common::Model; |
25
|
|
|
|
|
|
|
use LaTeXML::MathParser; |
26
|
|
|
|
|
|
|
use LaTeXML::Util::Pathname; |
27
|
|
|
|
|
|
|
use LaTeXML::Pre::BibTeX; |
28
|
|
|
|
|
|
|
use LaTeXML::Package; # !!!! |
29
|
|
|
|
|
|
|
use LaTeXML::Version; |
30
|
|
|
|
|
|
|
use Encode; |
31
|
|
|
|
|
|
|
use FindBin; |
32
|
|
|
|
|
|
|
use base qw(LaTeXML::Common::Object); |
33
|
|
|
|
|
|
|
|
34
|
|
|
|
|
|
|
#********************************************************************** |
35
|
|
|
|
|
|
|
|
36
|
|
|
|
|
|
|
sub new { |
37
|
|
|
|
|
|
|
my ($class, %options) = @_; |
38
|
|
|
|
|
|
|
my $state = LaTeXML::Core::State->new(catcodes => 'standard', |
39
|
|
|
|
|
|
|
stomach => LaTeXML::Core::Stomach->new(), |
40
|
|
|
|
|
|
|
model => $options{model} || LaTeXML::Common::Model->new()); |
41
|
|
|
|
|
|
|
$state->assignValue(VERBOSITY => (defined $options{verbosity} ? $options{verbosity} : 0), |
42
|
|
|
|
|
|
|
'global'); |
43
|
|
|
|
|
|
|
$state->assignValue(STRICT => (defined $options{strict} ? $options{strict} : 0), |
44
|
|
|
|
|
|
|
'global'); |
45
|
|
|
|
|
|
|
$state->assignValue(INCLUDE_COMMENTS => (defined $options{includeComments} ? $options{includeComments} : 1), |
46
|
|
|
|
|
|
|
'global'); |
47
|
|
|
|
|
|
|
$state->assignValue(DOCUMENTID => (defined $options{documentid} ? $options{documentid} : ''), |
48
|
|
|
|
|
|
|
'global'); |
49
|
|
|
|
|
|
|
$state->assignValue(SEARCHPATHS => [map { pathname_absolute(pathname_canonical($_)) } |
50
|
|
|
|
|
|
|
@{ $options{searchpaths} || [] }], |
51
|
|
|
|
|
|
|
'global'); |
52
|
|
|
|
|
|
|
$state->assignValue(GRAPHICSPATHS => [map { pathname_absolute(pathname_canonical($_)) } |
53
|
|
|
|
|
|
|
@{ $options{graphicspaths} || [] }], 'global'); |
54
|
|
|
|
|
|
|
$state->assignValue(INCLUDE_STYLES => $options{includeStyles} || 0, 'global'); |
55
|
|
|
|
|
|
|
$state->assignValue(PERL_INPUT_ENCODING => $options{inputencoding}) if $options{inputencoding}; |
56
|
|
|
|
|
|
|
$state->assignValue(NOMATHPARSE => $options{nomathparse} || 0, 'global'); |
57
|
|
|
|
|
|
|
return bless { state => $state, |
58
|
|
|
|
|
|
|
nomathparse => $options{nomathparse} || 0, |
59
|
|
|
|
|
|
|
preload => $options{preload}, |
60
|
|
|
|
|
|
|
}, $class; } |
61
|
|
|
|
|
|
|
|
62
|
|
|
|
|
|
|
#%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% |
63
|
|
|
|
|
|
|
# High-level API. |
64
|
|
|
|
|
|
|
|
65
|
|
|
|
|
|
|
sub convertAndWriteFile { |
66
|
|
|
|
|
|
|
my ($self, $file) = @_; |
67
|
|
|
|
|
|
|
$file =~ s/\.tex$//; |
68
|
|
|
|
|
|
|
my $dom = $self->convertFile($file); |
69
|
|
|
|
|
|
|
$dom->toFile("$file.xml", 1) if $dom; |
70
|
|
|
|
|
|
|
return $dom; } |
71
|
|
|
|
|
|
|
|
72
|
|
|
|
|
|
|
sub convertFile { |
73
|
|
|
|
|
|
|
my ($self, $file) = @_; |
74
|
|
|
|
|
|
|
my $digested = $self->digestFile($file); |
75
|
|
|
|
|
|
|
return unless $digested; |
76
|
|
|
|
|
|
|
return $self->convertDocument($digested); } |
77
|
|
|
|
|
|
|
|
78
|
|
|
|
|
|
|
sub getStatusMessage { |
79
|
|
|
|
|
|
|
my ($self) = @_; |
80
|
|
|
|
|
|
|
return $$self{state}->getStatusMessage; } |
81
|
|
|
|
|
|
|
|
82
|
|
|
|
|
|
|
sub getStatusCode { |
83
|
|
|
|
|
|
|
my ($self) = @_; |
84
|
|
|
|
|
|
|
return $$self{state}->getStatusCode; } |
85
|
|
|
|
|
|
|
|
86
|
|
|
|
|
|
|
# You'd typically do this after both digestion AND conversion... |
87
|
|
|
|
|
|
|
sub showProfile { |
88
|
|
|
|
|
|
|
my ($self, $digested) = @_; |
89
|
|
|
|
|
|
|
return |
90
|
|
|
|
|
|
|
$self->withState(sub { |
91
|
|
|
|
|
|
|
LaTeXML::Core::Definition::showProfile(); # Show profile (if any) |
92
|
|
|
|
|
|
|
}); } |
93
|
|
|
|
|
|
|
|
94
|
|
|
|
|
|
|
#%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% |
95
|
|
|
|
|
|
|
# Mid-level API. |
96
|
|
|
|
|
|
|
|
97
|
|
|
|
|
|
|
# options are currently being evolved to accomodate the Daemon: |
98
|
|
|
|
|
|
|
# mode : the processing mode, ie the pool to preload: TeX or BibTeX |
99
|
|
|
|
|
|
|
# noinitialize : if defined, it does not initialize State. |
100
|
|
|
|
|
|
|
# preamble = names a tex file (or standard_preamble.tex) |
101
|
|
|
|
|
|
|
# postamble = names a tex file (or standard_postamble.tex) |
102
|
|
|
|
|
|
|
|
103
|
|
|
|
|
|
|
our %MODE_EXTENSION = ( # CONFIGURATION? |
104
|
|
|
|
|
|
|
TeX => 'tex', LaTeX => 'tex', AmSTeX => 'tex', BibTeX => 'bib'); |
105
|
|
|
|
|
|
|
|
106
|
|
|
|
|
|
|
sub digestFile { |
107
|
|
|
|
|
|
|
my ($self, $request, %options) = @_; |
108
|
|
|
|
|
|
|
my ($dir, $name, $ext); |
109
|
|
|
|
|
|
|
my $mode = $options{mode} || 'TeX'; |
110
|
|
|
|
|
|
|
if (pathname_is_literaldata($request)) { |
111
|
|
|
|
|
|
|
$dir = undef; $ext = $MODE_EXTENSION{$mode}; |
112
|
|
|
|
|
|
|
$name = "Anonymous String"; } |
113
|
|
|
|
|
|
|
elsif (pathname_is_url($request)) { |
114
|
|
|
|
|
|
|
$dir = undef; $ext = $MODE_EXTENSION{$mode}; |
115
|
|
|
|
|
|
|
$name = $request; |
116
|
|
|
|
|
|
|
} |
117
|
|
|
|
|
|
|
else { |
118
|
|
|
|
|
|
|
$request =~ s/\.\Q$MODE_EXTENSION{$mode}\E$//; |
119
|
|
|
|
|
|
|
if (my $pathname = pathname_find($request, types => [$MODE_EXTENSION{$mode}, ''])) { |
120
|
|
|
|
|
|
|
$request = $pathname; |
121
|
|
|
|
|
|
|
($dir, $name, $ext) = pathname_split($request); } |
122
|
|
|
|
|
|
|
else { |
123
|
|
|
|
|
|
|
$self->withState(sub { |
124
|
|
|
|
|
|
|
Fatal('missing_file', $request, undef, "Can't find $mode file $request"); }); } } |
125
|
|
|
|
|
|
|
return |
126
|
|
|
|
|
|
|
$self->withState(sub { |
127
|
|
|
|
|
|
|
my ($state) = @_; |
128
|
|
|
|
|
|
|
NoteBegin("Digesting $mode $name"); |
129
|
|
|
|
|
|
|
$self->initializeState($mode . ".pool", @{ $$self{preload} || [] }) unless $options{noinitialize}; |
130
|
|
|
|
|
|
|
$state->assignValue(SOURCEFILE => $request) if (!pathname_is_literaldata($request)); |
131
|
|
|
|
|
|
|
$state->assignValue(SOURCEDIRECTORY => $dir) if defined $dir; |
132
|
|
|
|
|
|
|
$state->unshiftValue(SEARCHPATHS => $dir) |
133
|
|
|
|
|
|
|
if defined $dir && !grep { $_ eq $dir } @{ $state->lookupValue('SEARCHPATHS') }; |
134
|
|
|
|
|
|
|
$state->unshiftValue(GRAPHICSPATHS => $dir) |
135
|
|
|
|
|
|
|
|
136
|
|
|
|
|
|
|
if defined $dir && !grep { $_ eq $dir } @{ $state->lookupValue('GRAPHICSPATHS') }; |
137
|
|
|
|
|
|
|
|
138
|
|
|
|
|
|
|
$state->installDefinition(LaTeXML::Core::Definition::Expandable->new(T_CS('\jobname'), undef, |
139
|
|
|
|
|
|
|
Tokens(Explode($name)))); |
140
|
|
|
|
|
|
|
# Reverse order, since last opened is first read! |
141
|
|
|
|
|
|
|
$self->loadPostamble($options{postamble}) if $options{postamble}; |
142
|
|
|
|
|
|
|
LaTeXML::Package::InputContent($request); |
143
|
|
|
|
|
|
|
$self->loadPreamble($options{preamble}) if $options{preamble}; |
144
|
|
|
|
|
|
|
|
145
|
|
|
|
|
|
|
# Now for the Hacky part for BibTeX!!! |
146
|
|
|
|
|
|
|
if ($mode eq 'BibTeX') { |
147
|
|
|
|
|
|
|
my $bib = LaTeXML::Pre::BibTeX->newFromGullet($name, $state->getStomach->getGullet); |
148
|
|
|
|
|
|
|
LaTeXML::Package::InputContent("literal:" . $bib->toTeX); } |
149
|
|
|
|
|
|
|
my $list = $self->finishDigestion; |
150
|
|
|
|
|
|
|
NoteEnd("Digesting $mode $name"); |
151
|
|
|
|
|
|
|
return $list; }); |
152
|
|
|
|
|
|
|
} |
153
|
|
|
|
|
|
|
|
154
|
|
|
|
|
|
|
sub finishDigestion { |
155
|
|
|
|
|
|
|
my ($self) = @_; |
156
|
|
|
|
|
|
|
my $state = $$self{state}; |
157
|
|
|
|
|
|
|
my $stomach = $state->getStomach; |
158
|
|
|
|
|
|
|
my @stuff = (); |
159
|
|
|
|
|
|
|
while ($stomach->getGullet->getMouth->hasMoreInput) { |
160
|
|
|
|
|
|
|
push(@stuff, $stomach->digestNextBody); } |
161
|
|
|
|
|
|
|
if (my $env = $state->lookupValue('current_environment')) { |
162
|
|
|
|
|
|
|
Error('expected', "\\end{$env}", $stomach, |
163
|
|
|
|
|
|
|
"Input ended while environment $env was open"); } |
164
|
|
|
|
|
|
|
my $ifstack = $state->lookupValue('if_stack'); |
165
|
|
|
|
|
|
|
if ($ifstack && $$ifstack[0]) { |
166
|
|
|
|
|
|
|
Error('expected', '\fi', $stomach, |
167
|
|
|
|
|
|
|
"Input ended while conditional " . ToString($$ifstack[0]{token}) . " was incomplete", |
168
|
|
|
|
|
|
|
"started at " . ToString($$ifstack[0]{start})); } |
169
|
|
|
|
|
|
|
$stomach->getGullet->flush; |
170
|
|
|
|
|
|
|
return List(@stuff); } |
171
|
|
|
|
|
|
|
|
172
|
|
|
|
|
|
|
sub loadPreamble { |
173
|
|
|
|
|
|
|
my ($self, $preamble) = @_; |
174
|
|
|
|
|
|
|
my $gullet = $$self{state}->getStomach->getGullet; |
175
|
|
|
|
|
|
|
if ($preamble eq 'standard_preamble.tex') { |
176
|
|
|
|
|
|
|
$preamble = 'literal:\documentclass{article}\begin{document}'; } |
177
|
|
|
|
|
|
|
return LaTeXML::Package::InputContent($preamble); } |
178
|
|
|
|
|
|
|
|
179
|
|
|
|
|
|
|
sub loadPostamble { |
180
|
|
|
|
|
|
|
my ($self, $postamble) = @_; |
181
|
|
|
|
|
|
|
my $gullet = $$self{state}->getStomach->getGullet; |
182
|
|
|
|
|
|
|
if ($postamble eq 'standard_postamble.tex') { |
183
|
|
|
|
|
|
|
$postamble = 'literal:\end{document}'; } |
184
|
|
|
|
|
|
|
return LaTeXML::Package::InputContent($postamble); } |
185
|
|
|
|
|
|
|
|
186
|
|
|
|
|
|
|
sub convertDocument { |
187
|
|
|
|
|
|
|
my ($self, $digested) = @_; |
188
|
|
|
|
|
|
|
return |
189
|
|
|
|
|
|
|
$self->withState(sub { |
190
|
|
|
|
|
|
|
my ($state) = @_; |
191
|
|
|
|
|
|
|
my $model = $state->getModel; # The document model. |
192
|
|
|
|
|
|
|
my $document = LaTeXML::Core::Document->new($model); |
193
|
|
|
|
|
|
|
local $LaTeXML::DOCUMENT = $document; |
194
|
|
|
|
|
|
|
NoteBegin("Building"); |
195
|
|
|
|
|
|
|
$model->loadSchema(); # If needed? |
196
|
|
|
|
|
|
|
if (my $paths = $state->lookupValue('SEARCHPATHS')) { |
197
|
|
|
|
|
|
|
if ($state->lookupValue('INCLUDE_COMMENTS')) { |
198
|
|
|
|
|
|
|
$document->insertPI('latexml', searchpaths => join(',', @$paths)); } } |
199
|
|
|
|
|
|
|
foreach my $preload (@{ $$self{preload} }) { |
200
|
|
|
|
|
|
|
next if $preload =~ /\.pool$/; |
201
|
|
|
|
|
|
|
my $options = undef; # Stupid perlcritic policy |
202
|
|
|
|
|
|
|
if ($preload =~ s/^\[([^\]]*)\]//) { $options = $1; } |
203
|
|
|
|
|
|
|
if ($preload =~ s/\.cls$//) { |
204
|
|
|
|
|
|
|
$document->insertPI('latexml', class => $preload, ($options ? (options => $options) : ())); } |
205
|
|
|
|
|
|
|
else { |
206
|
|
|
|
|
|
|
$preload =~ s/\.sty$//; |
207
|
|
|
|
|
|
|
$document->insertPI('latexml', package => $preload, ($options ? (options => $options) : ())); } } |
208
|
|
|
|
|
|
|
{ no warnings 'recursion'; |
209
|
|
|
|
|
|
|
$document->absorb($digested); } |
210
|
|
|
|
|
|
|
NoteEnd("Building"); |
211
|
|
|
|
|
|
|
|
212
|
|
|
|
|
|
|
if (my $rules = $state->lookupValue('DOCUMENT_REWRITE_RULES')) { |
213
|
|
|
|
|
|
|
NoteBegin("Rewriting"); |
214
|
|
|
|
|
|
|
$document->markXMNodeVisibility; |
215
|
|
|
|
|
|
|
foreach my $rule (@$rules) { |
216
|
|
|
|
|
|
|
$rule->rewrite($document, $document->getDocument->documentElement); } |
217
|
|
|
|
|
|
|
NoteEnd("Rewriting"); } |
218
|
|
|
|
|
|
|
|
219
|
|
|
|
|
|
|
LaTeXML::MathParser->new()->parseMath($document) unless $$self{nomathparse}; |
220
|
|
|
|
|
|
|
NoteBegin("Finalizing"); |
221
|
|
|
|
|
|
|
my $xmldoc = $document->finalize(); |
222
|
|
|
|
|
|
|
NoteEnd("Finalizing"); |
223
|
|
|
|
|
|
|
return $xmldoc; }); } |
224
|
|
|
|
|
|
|
|
225
|
|
|
|
|
|
|
sub withState { |
226
|
|
|
|
|
|
|
my ($self, $closure) = @_; |
227
|
|
|
|
|
|
|
local $STATE = $$self{state}; |
228
|
|
|
|
|
|
|
# And, set fancy error handler for ANY die! |
229
|
|
|
|
|
|
|
local $SIG{__DIE__} = \&LaTeXML::Common::Error::perl_die_handler; |
230
|
|
|
|
|
|
|
local $SIG{INT} = \&LaTeXML::Common::Error::perl_interrupt_handler; |
231
|
|
|
|
|
|
|
local $SIG{__WARN__} = \&LaTeXML::Common::Error::perl_warn_handler; |
232
|
|
|
|
|
|
|
local $SIG{'ALRM'} = \&LaTeXML::Common::Error::perl_timeout_handler; |
233
|
|
|
|
|
|
|
local $SIG{'TERM'} = \&LaTeXML::Common::Error::perl_terminate_handler; |
234
|
|
|
|
|
|
|
|
235
|
|
|
|
|
|
|
local $LaTeXML::DUAL_BRANCH = ''; |
236
|
|
|
|
|
|
|
|
237
|
|
|
|
|
|
|
return &$closure($STATE); } |
238
|
|
|
|
|
|
|
|
239
|
|
|
|
|
|
|
sub initializeState { |
240
|
|
|
|
|
|
|
my ($self, @files) = @_; |
241
|
|
|
|
|
|
|
my $state = $$self{state}; |
242
|
|
|
|
|
|
|
my $stomach = $state->getStomach; # The current Stomach; |
243
|
|
|
|
|
|
|
my $gullet = $stomach->getGullet; |
244
|
|
|
|
|
|
|
$stomach->initialize; |
245
|
|
|
|
|
|
|
my $paths = $state->lookupValue('SEARCHPATHS'); |
246
|
|
|
|
|
|
|
$state->assignValue('InitialPreloads' => 1, 'global'); |
247
|
|
|
|
|
|
|
foreach my $preload (@files) { |
248
|
|
|
|
|
|
|
my ($options, $type); |
249
|
|
|
|
|
|
|
$options = $1 if $preload =~ s/^\[([^\]]*)\]//; |
250
|
|
|
|
|
|
|
$type = ($preload =~ s/\.(\w+)$// ? $1 : 'sty'); |
251
|
|
|
|
|
|
|
my $handleoptions = ($type eq 'sty') || ($type eq 'cls'); |
252
|
|
|
|
|
|
|
if ($options) { |
253
|
|
|
|
|
|
|
if ($handleoptions) { |
254
|
|
|
|
|
|
|
$options = [split(/,/, $options)]; } |
255
|
|
|
|
|
|
|
else { |
256
|
|
|
|
|
|
|
Warn('unexpected', 'options', |
257
|
|
|
|
|
|
|
"Attempting to pass options to $preload.$type (not style or class)", |
258
|
|
|
|
|
|
|
"The options were [$options]"); } } |
259
|
|
|
|
|
|
|
# Attach extension back if HTTP protocol: |
260
|
|
|
|
|
|
|
if (pathname_is_url($preload)) { |
261
|
|
|
|
|
|
|
$preload .= '.' . $type; |
262
|
|
|
|
|
|
|
} |
263
|
|
|
|
|
|
|
LaTeXML::Package::InputDefinitions($preload, type => $type, |
264
|
|
|
|
|
|
|
handleoptions => $handleoptions, options => $options); |
265
|
|
|
|
|
|
|
} |
266
|
|
|
|
|
|
|
$state->assignValue('InitialPreloads' => undef, 'global'); |
267
|
|
|
|
|
|
|
return; } |
268
|
|
|
|
|
|
|
|
269
|
|
|
|
|
|
|
sub writeDOM { |
270
|
|
|
|
|
|
|
my ($self, $dom, $name) = @_; |
271
|
|
|
|
|
|
|
$dom->toFile("$name.xml", 1); |
272
|
|
|
|
|
|
|
return 1; } |
273
|
|
|
|
|
|
|
|
274
|
|
|
|
|
|
|
#********************************************************************** |
275
|
|
|
|
|
|
|
# Should post processing be managed from here too? |
276
|
|
|
|
|
|
|
# Problem: with current DOM setup, I pretty much have to write the |
277
|
|
|
|
|
|
|
# file and reread it anyway... |
278
|
|
|
|
|
|
|
# Also, want to inhibit loading an extreme number of classes if not needed. |
279
|
|
|
|
|
|
|
#********************************************************************** |
280
|
|
|
|
|
|
|
1; |
281
|
|
|
|
|
|
|
|
282
|
|
|
|
|
|
|
__END__ |