| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
package Chemistry::Mok; |
|
2
|
|
|
|
|
|
|
|
|
3
|
|
|
|
|
|
|
$VERSION = '0.25'; |
|
4
|
|
|
|
|
|
|
# $Id: Mok.pm,v 1.10 2005/05/16 21:54:21 itubert Exp $ |
|
5
|
|
|
|
|
|
|
|
|
6
|
1
|
|
|
1
|
|
100489
|
use strict; |
|
|
1
|
|
|
|
|
4
|
|
|
|
1
|
|
|
|
|
53
|
|
|
7
|
1
|
|
|
1
|
|
6
|
use warnings; |
|
|
1
|
|
|
|
|
2
|
|
|
|
1
|
|
|
|
|
40
|
|
|
8
|
1
|
|
|
1
|
|
2174
|
use Chemistry::Mol; |
|
|
1
|
|
|
|
|
55682
|
|
|
|
1
|
|
|
|
|
83
|
|
|
9
|
1
|
|
|
1
|
|
1362
|
use Chemistry::File ':auto'; |
|
|
1
|
|
|
|
|
19456
|
|
|
|
1
|
|
|
|
|
8
|
|
|
10
|
1
|
|
|
1
|
|
74412
|
use Chemistry::Pattern; |
|
|
1
|
|
|
|
|
3
|
|
|
|
1
|
|
|
|
|
68
|
|
|
11
|
1
|
|
|
1
|
|
6
|
use Chemistry::Bond::Find qw(find_bonds assign_bond_orders); |
|
|
1
|
|
|
|
|
2
|
|
|
|
1
|
|
|
|
|
66
|
|
|
12
|
1
|
|
|
1
|
|
1157
|
use Chemistry::Ring 'aromatize_mol'; |
|
|
1
|
|
|
|
|
7809
|
|
|
|
1
|
|
|
|
|
80
|
|
|
13
|
1
|
|
|
1
|
|
2232
|
use Chemistry::3DBuilder 'build_3d'; |
|
|
0
|
|
|
|
|
|
|
|
|
0
|
|
|
|
|
|
|
|
14
|
|
|
|
|
|
|
use Text::Balanced ':ALL'; |
|
15
|
|
|
|
|
|
|
use Scalar::Util 'blessed'; |
|
16
|
|
|
|
|
|
|
use Data::Dumper; |
|
17
|
|
|
|
|
|
|
use Carp; |
|
18
|
|
|
|
|
|
|
|
|
19
|
|
|
|
|
|
|
our $DEBUG = 0; |
|
20
|
|
|
|
|
|
|
|
|
21
|
|
|
|
|
|
|
=head1 NAME |
|
22
|
|
|
|
|
|
|
|
|
23
|
|
|
|
|
|
|
Chemistry::Mok - molecular awk interpreter |
|
24
|
|
|
|
|
|
|
|
|
25
|
|
|
|
|
|
|
=head1 SYNOPSIS |
|
26
|
|
|
|
|
|
|
|
|
27
|
|
|
|
|
|
|
use Chemistry::Mok; |
|
28
|
|
|
|
|
|
|
$code = '/CS/g{ $n++; $l += $match->bond_map(0)->length } |
|
29
|
|
|
|
|
|
|
END { printf "Average C-S bond length: %.3f\n", $l/$n; }'; |
|
30
|
|
|
|
|
|
|
|
|
31
|
|
|
|
|
|
|
my $mok = Chemistry::Mok->new($code); |
|
32
|
|
|
|
|
|
|
$mok->run({ format => mdlmol }, glob("*.mol")); |
|
33
|
|
|
|
|
|
|
|
|
34
|
|
|
|
|
|
|
=head1 DESCRIPTION |
|
35
|
|
|
|
|
|
|
|
|
36
|
|
|
|
|
|
|
This module is the engine behind the mok program. See mok(1) for a detailed |
|
37
|
|
|
|
|
|
|
description of the language. Mok is part of the PerlMol project, |
|
38
|
|
|
|
|
|
|
L. |
|
39
|
|
|
|
|
|
|
|
|
40
|
|
|
|
|
|
|
=head1 METHODS |
|
41
|
|
|
|
|
|
|
|
|
42
|
|
|
|
|
|
|
=over |
|
43
|
|
|
|
|
|
|
|
|
44
|
|
|
|
|
|
|
=cut |
|
45
|
|
|
|
|
|
|
|
|
46
|
|
|
|
|
|
|
sub tokenize { |
|
47
|
|
|
|
|
|
|
my ($self, $code) = @_; |
|
48
|
|
|
|
|
|
|
|
|
49
|
|
|
|
|
|
|
$code =~ s/\s*$//; # Text::Balanced complains about trailing whitespace |
|
50
|
|
|
|
|
|
|
#$code =~ s/^\s*#.*//g; # remove comments at the top of the file |
|
51
|
|
|
|
|
|
|
#unless($code =~ /^\s*([\/{#]|sub|BEGIN|END)/) { |
|
52
|
|
|
|
|
|
|
unless($code =~ /^(\s*#.*)*\s*([\/{]|sub|BEGIN|END|\w+:\s*\/)/) { |
|
53
|
|
|
|
|
|
|
print "MOK: adding implicit braces\n" if $DEBUG; |
|
54
|
|
|
|
|
|
|
$code = "{$code}"; # add implicit brackets for simple one-liners |
|
55
|
|
|
|
|
|
|
} |
|
56
|
|
|
|
|
|
|
#print "code = '$code'\n"; |
|
57
|
|
|
|
|
|
|
# (patt opt?)? code | sub code |
|
58
|
|
|
|
|
|
|
my @toks = extract_multiple(my $c = $code, |
|
59
|
|
|
|
|
|
|
[ |
|
60
|
|
|
|
|
|
|
{ 'Chemistry::Mok::Comment' => |
|
61
|
|
|
|
|
|
|
qr/\s*#.*\s*/ }, |
|
62
|
|
|
|
|
|
|
{ 'Chemistry::Mok::Patt' => |
|
63
|
|
|
|
|
|
|
sub { scalar extract_delimited($_[0],'/') } }, |
|
64
|
|
|
|
|
|
|
{ 'Chemistry::Mok::Sub' => |
|
65
|
|
|
|
|
|
|
qr/\s*(?:END|BEGIN|sub\s+\w+)\s*/ }, |
|
66
|
|
|
|
|
|
|
{ 'Chemistry::Mok::Block' => |
|
67
|
|
|
|
|
|
|
sub { scalar extract_codeblock($_[0],'{') } }, |
|
68
|
|
|
|
|
|
|
{ 'Chemistry::Mok::PattLang' => |
|
69
|
|
|
|
|
|
|
qr/(\s*\w+):(?=\s*\/)/ }, |
|
70
|
|
|
|
|
|
|
{ 'Chemistry::Mok::Opts' => |
|
71
|
|
|
|
|
|
|
qr/[gopGOP]+/ }, |
|
72
|
|
|
|
|
|
|
], |
|
73
|
|
|
|
|
|
|
); |
|
74
|
|
|
|
|
|
|
die "Mok: error extracting: $@" if $@; |
|
75
|
|
|
|
|
|
|
print "MOK: TOKENS:\n", Dumper(\@toks), "\nCODE:<<<<$code>>>>\n\n" |
|
76
|
|
|
|
|
|
|
if $DEBUG; |
|
77
|
|
|
|
|
|
|
@toks; |
|
78
|
|
|
|
|
|
|
} |
|
79
|
|
|
|
|
|
|
|
|
80
|
|
|
|
|
|
|
sub parse { |
|
81
|
|
|
|
|
|
|
my ($self, @toks) = @_; |
|
82
|
|
|
|
|
|
|
|
|
83
|
|
|
|
|
|
|
my (@subs, @blocks); |
|
84
|
|
|
|
|
|
|
for my $tok (@toks) { |
|
85
|
|
|
|
|
|
|
blessed $tok or die "unparsable token '$tok'\n"; |
|
86
|
|
|
|
|
|
|
} |
|
87
|
|
|
|
|
|
|
|
|
88
|
|
|
|
|
|
|
### new parser |
|
89
|
|
|
|
|
|
|
|
|
90
|
|
|
|
|
|
|
my $st = 1; |
|
91
|
|
|
|
|
|
|
my ($patt, $opts, $block, $sub, $pattlang) = ('') x 5; |
|
92
|
|
|
|
|
|
|
my ($save) = 0; |
|
93
|
|
|
|
|
|
|
my $line; |
|
94
|
|
|
|
|
|
|
my $next_line = 1; |
|
95
|
|
|
|
|
|
|
while (my $tok = shift @toks) { |
|
96
|
|
|
|
|
|
|
$line = $next_line; |
|
97
|
|
|
|
|
|
|
$next_line += $$tok =~ y/\n//; |
|
98
|
|
|
|
|
|
|
print "MOK: LINE=$line;\nTOK=<<<<$$tok>>>>;\nNEXT_LINE=$next_line\n\n" |
|
99
|
|
|
|
|
|
|
if $DEBUG; |
|
100
|
|
|
|
|
|
|
next if $tok->isa("Chemistry::Mok::Comment"); |
|
101
|
|
|
|
|
|
|
if ($st == 1) { |
|
102
|
|
|
|
|
|
|
if ($tok->isa("Chemistry::Mok::Block")){ |
|
103
|
|
|
|
|
|
|
$block = $$tok, $save = 1; |
|
104
|
|
|
|
|
|
|
} elsif ($tok->isa("Chemistry::Mok::Sub")) { |
|
105
|
|
|
|
|
|
|
$sub = $$tok, $st = 5, next; |
|
106
|
|
|
|
|
|
|
} elsif ($tok->isa("Chemistry::Mok::PattLang")) { |
|
107
|
|
|
|
|
|
|
$pattlang = $$tok, $st = 4, next; |
|
108
|
|
|
|
|
|
|
} elsif ($tok->isa("Chemistry::Mok::Patt")) { |
|
109
|
|
|
|
|
|
|
$patt = $$tok, $st = 2, next; |
|
110
|
|
|
|
|
|
|
} |
|
111
|
|
|
|
|
|
|
} elsif ($st == 2) { |
|
112
|
|
|
|
|
|
|
if ($tok->isa("Chemistry::Mok::Block")){ |
|
113
|
|
|
|
|
|
|
$block = $$tok, $save = 1; |
|
114
|
|
|
|
|
|
|
} elsif ($tok->isa("Chemistry::Mok::Opts")){ |
|
115
|
|
|
|
|
|
|
$opts = $$tok, $st = 3, next; |
|
116
|
|
|
|
|
|
|
} |
|
117
|
|
|
|
|
|
|
} elsif ($st == 3) { |
|
118
|
|
|
|
|
|
|
if ($tok->isa("Chemistry::Mok::Block")){ |
|
119
|
|
|
|
|
|
|
$block = $$tok, $save = 1; |
|
120
|
|
|
|
|
|
|
} |
|
121
|
|
|
|
|
|
|
} elsif ($st == 4) { |
|
122
|
|
|
|
|
|
|
if ($tok->isa("Chemistry::Mok::Patt")){ |
|
123
|
|
|
|
|
|
|
$patt = $$tok, $st = 2, next; |
|
124
|
|
|
|
|
|
|
} |
|
125
|
|
|
|
|
|
|
} elsif ($st == 5) { |
|
126
|
|
|
|
|
|
|
if ($tok->isa("Chemistry::Mok::Block")){ |
|
127
|
|
|
|
|
|
|
$block = $$tok, $save = 1; |
|
128
|
|
|
|
|
|
|
} |
|
129
|
|
|
|
|
|
|
} else { |
|
130
|
|
|
|
|
|
|
confess "unknown state '$st'"; |
|
131
|
|
|
|
|
|
|
} |
|
132
|
|
|
|
|
|
|
if ($save) { # save block and go back to state 1 |
|
133
|
|
|
|
|
|
|
if ($sub) { |
|
134
|
|
|
|
|
|
|
push @subs, { block => "$sub $$tok", line => $line }; |
|
135
|
|
|
|
|
|
|
} else { |
|
136
|
|
|
|
|
|
|
push @blocks, { patt => $patt, opts => $opts, |
|
137
|
|
|
|
|
|
|
pattlang => $pattlang, block => $$tok, |
|
138
|
|
|
|
|
|
|
line => $line}; |
|
139
|
|
|
|
|
|
|
} |
|
140
|
|
|
|
|
|
|
$patt = $opts = $pattlang = $block = $sub = ''; |
|
141
|
|
|
|
|
|
|
$st = 1, $save = 0, next; |
|
142
|
|
|
|
|
|
|
} else { |
|
143
|
|
|
|
|
|
|
die "unexpected token '$$tok' (type '" . ref($tok) . "'\n"; |
|
144
|
|
|
|
|
|
|
} |
|
145
|
|
|
|
|
|
|
} |
|
146
|
|
|
|
|
|
|
print "MOK: BLOCKS\n", Dumper(\@blocks), "\nSUBS:\n", Dumper(\@subs), "\n" |
|
147
|
|
|
|
|
|
|
if $DEBUG; |
|
148
|
|
|
|
|
|
|
|
|
149
|
|
|
|
|
|
|
\@subs, \@blocks; |
|
150
|
|
|
|
|
|
|
} |
|
151
|
|
|
|
|
|
|
|
|
152
|
|
|
|
|
|
|
sub compile_subs { |
|
153
|
|
|
|
|
|
|
my ($self, @subs) = @_; |
|
154
|
|
|
|
|
|
|
my $pack = $self->{package}; |
|
155
|
|
|
|
|
|
|
|
|
156
|
|
|
|
|
|
|
for my $sub (@subs) { |
|
157
|
|
|
|
|
|
|
my $code = <
|
|
158
|
|
|
|
|
|
|
package Chemistry::Mok::UserCode::$pack; |
|
159
|
|
|
|
|
|
|
no strict; |
|
160
|
|
|
|
|
|
|
no warnings; |
|
161
|
|
|
|
|
|
|
#line $sub->{line} "mok code" |
|
162
|
|
|
|
|
|
|
$sub->{block} |
|
163
|
|
|
|
|
|
|
END |
|
164
|
|
|
|
|
|
|
print "MOK: COMPILING SUB: <<<<$code>>>>\n\n" if $DEBUG; |
|
165
|
|
|
|
|
|
|
eval $code; |
|
166
|
|
|
|
|
|
|
die "Mok: error compiling sub: $@" if $@; |
|
167
|
|
|
|
|
|
|
} |
|
168
|
|
|
|
|
|
|
} |
|
169
|
|
|
|
|
|
|
|
|
170
|
|
|
|
|
|
|
sub compile_blocks { |
|
171
|
|
|
|
|
|
|
my ($self, @blocks) = @_; |
|
172
|
|
|
|
|
|
|
my $pack = $self->{package}; |
|
173
|
|
|
|
|
|
|
my $format = $self->{pattern_format}; |
|
174
|
|
|
|
|
|
|
my @compiled_blocks; |
|
175
|
|
|
|
|
|
|
|
|
176
|
|
|
|
|
|
|
for my $block (@blocks) { |
|
177
|
|
|
|
|
|
|
#use Data::Dumper; print Dumper $block; |
|
178
|
|
|
|
|
|
|
my $code = <
|
|
179
|
|
|
|
|
|
|
package Chemistry::Mok::UserCode::$pack; |
|
180
|
|
|
|
|
|
|
no strict; |
|
181
|
|
|
|
|
|
|
no warnings; |
|
182
|
|
|
|
|
|
|
sub { |
|
183
|
|
|
|
|
|
|
my (\$mol, \$file, \$match, \$patt) = \@_; |
|
184
|
|
|
|
|
|
|
my (\$MOL, \$FILE, \$MATCH, \$PATT, \$FH) = \@_; |
|
185
|
|
|
|
|
|
|
my (\@A) = \$MATCH ? \$MATCH->atom_map : \$MOL->atoms; |
|
186
|
|
|
|
|
|
|
my (\@B) = \$MATCH ? \$MATCH->bond_map : \$MOL->bonds; |
|
187
|
|
|
|
|
|
|
#line $block->{line} "mok code" |
|
188
|
|
|
|
|
|
|
$block->{block}; |
|
189
|
|
|
|
|
|
|
} |
|
190
|
|
|
|
|
|
|
END |
|
191
|
|
|
|
|
|
|
print "MOK: COMPILING BLOCK: <<<<$code>>>>\n\n" if $DEBUG; |
|
192
|
|
|
|
|
|
|
my $sub = eval $code; |
|
193
|
|
|
|
|
|
|
die "Mol: Error compiling block: $@" if $@; |
|
194
|
|
|
|
|
|
|
|
|
195
|
|
|
|
|
|
|
my ($patt, $patt_str); |
|
196
|
|
|
|
|
|
|
if ($block->{patt}) { |
|
197
|
|
|
|
|
|
|
$block->{patt} =~ m#^/(.*)/$#; |
|
198
|
|
|
|
|
|
|
$patt_str = $1; |
|
199
|
|
|
|
|
|
|
$patt = Chemistry::Pattern->parse($patt_str, |
|
200
|
|
|
|
|
|
|
format => $block->{pattlang} || $format); |
|
201
|
|
|
|
|
|
|
$patt->attr(global => 1) if $block->{opts} =~ /g/; |
|
202
|
|
|
|
|
|
|
$patt->options(overlap => 0) if $block->{opts} =~ /O/; |
|
203
|
|
|
|
|
|
|
$patt->options(permute => 1) if $block->{opts} =~ /p/; |
|
204
|
|
|
|
|
|
|
} |
|
205
|
|
|
|
|
|
|
push @compiled_blocks, {'sub' => $sub, |
|
206
|
|
|
|
|
|
|
patt => $patt, patt_str => $patt_str}; |
|
207
|
|
|
|
|
|
|
} |
|
208
|
|
|
|
|
|
|
\@compiled_blocks; |
|
209
|
|
|
|
|
|
|
} |
|
210
|
|
|
|
|
|
|
|
|
211
|
|
|
|
|
|
|
=item Chemistry::Mok->new($code, %options) |
|
212
|
|
|
|
|
|
|
|
|
213
|
|
|
|
|
|
|
Compile the code and return a Chemistry::Mok object. Available options: |
|
214
|
|
|
|
|
|
|
|
|
215
|
|
|
|
|
|
|
=over |
|
216
|
|
|
|
|
|
|
|
|
217
|
|
|
|
|
|
|
=item C |
|
218
|
|
|
|
|
|
|
|
|
219
|
|
|
|
|
|
|
If the C option is given, the code runs in the |
|
220
|
|
|
|
|
|
|
Chemistry::Mok::UserCode::$options{package} package instead of the |
|
221
|
|
|
|
|
|
|
Chemistry::Mok::UserCode::Default package. Specifying a package name is |
|
222
|
|
|
|
|
|
|
recommended if you have more than one mok object and you are using global |
|
223
|
|
|
|
|
|
|
varaibles, in order to avoid namespace clashes. |
|
224
|
|
|
|
|
|
|
|
|
225
|
|
|
|
|
|
|
=item C |
|
226
|
|
|
|
|
|
|
|
|
227
|
|
|
|
|
|
|
The name of the format which will be used for parsing slash-delimited patterns |
|
228
|
|
|
|
|
|
|
that don't define an explicit format. Mok versions until 0.16 only used the |
|
229
|
|
|
|
|
|
|
'smiles' format, but newer versions can use other formats such as 'smarts', |
|
230
|
|
|
|
|
|
|
'midas', 'formula_pattern', and 'sln', if available. The default is 'smarts'. |
|
231
|
|
|
|
|
|
|
|
|
232
|
|
|
|
|
|
|
=back |
|
233
|
|
|
|
|
|
|
|
|
234
|
|
|
|
|
|
|
=cut |
|
235
|
|
|
|
|
|
|
|
|
236
|
|
|
|
|
|
|
sub new { |
|
237
|
|
|
|
|
|
|
my ($class, $code, @a) = @_; |
|
238
|
|
|
|
|
|
|
my %opts; |
|
239
|
|
|
|
|
|
|
|
|
240
|
|
|
|
|
|
|
# for backwards compatibility with Chemistry::Mok->new($code, $package) |
|
241
|
|
|
|
|
|
|
unshift @a, "package" if (@a == 1); |
|
242
|
|
|
|
|
|
|
%opts = @a; |
|
243
|
|
|
|
|
|
|
|
|
244
|
|
|
|
|
|
|
my $self = bless { |
|
245
|
|
|
|
|
|
|
'package' => $opts{package} || "Default", |
|
246
|
|
|
|
|
|
|
pattern_format => $opts{pattern_format} || "smarts", |
|
247
|
|
|
|
|
|
|
}, $class; |
|
248
|
|
|
|
|
|
|
|
|
249
|
|
|
|
|
|
|
$self->setup_package; |
|
250
|
|
|
|
|
|
|
my @toks = $self->tokenize($code); |
|
251
|
|
|
|
|
|
|
my ($subs, $blocks) = $self->parse(@toks); |
|
252
|
|
|
|
|
|
|
$self->compile_subs(@$subs); |
|
253
|
|
|
|
|
|
|
$self->{blocks} = $self->compile_blocks(@$blocks); |
|
254
|
|
|
|
|
|
|
|
|
255
|
|
|
|
|
|
|
return $self; |
|
256
|
|
|
|
|
|
|
} |
|
257
|
|
|
|
|
|
|
|
|
258
|
|
|
|
|
|
|
sub setup_package { |
|
259
|
|
|
|
|
|
|
my ($self) = @_; |
|
260
|
|
|
|
|
|
|
my $usr_pack = $self->{package}; |
|
261
|
|
|
|
|
|
|
# import convenience functions into the user's namespace |
|
262
|
|
|
|
|
|
|
eval <
|
|
263
|
|
|
|
|
|
|
package Chemistry::Mok::UserCode::$usr_pack; |
|
264
|
|
|
|
|
|
|
use Chemistry::Atom ':all'; |
|
265
|
|
|
|
|
|
|
use Chemistry::Ring ':all'; |
|
266
|
|
|
|
|
|
|
use Chemistry::Ring::Find ':all'; |
|
267
|
|
|
|
|
|
|
use Chemistry::Bond::Find ':all'; |
|
268
|
|
|
|
|
|
|
use Chemistry::Canonicalize ':all'; |
|
269
|
|
|
|
|
|
|
use Chemistry::InternalCoords::Builder ':all'; |
|
270
|
|
|
|
|
|
|
use Chemistry::Isotope ':all'; |
|
271
|
|
|
|
|
|
|
use Math::VectorReal ':all'; |
|
272
|
|
|
|
|
|
|
use Chemistry::3DBuilder ':all'; |
|
273
|
|
|
|
|
|
|
sub println { print "\@_", "\n" } |
|
274
|
|
|
|
|
|
|
EVAL |
|
275
|
|
|
|
|
|
|
die "Mok: error setting up 'Chemistry::Mok::UserCode::$usr_pack' $@" if $@; |
|
276
|
|
|
|
|
|
|
} |
|
277
|
|
|
|
|
|
|
|
|
278
|
|
|
|
|
|
|
=item $mok->run($options, @args) |
|
279
|
|
|
|
|
|
|
|
|
280
|
|
|
|
|
|
|
Run the code on the filenames contained in @args. $options is a hash reference |
|
281
|
|
|
|
|
|
|
with runtime options. Available options: |
|
282
|
|
|
|
|
|
|
|
|
283
|
|
|
|
|
|
|
=over |
|
284
|
|
|
|
|
|
|
|
|
285
|
|
|
|
|
|
|
=item build_3d |
|
286
|
|
|
|
|
|
|
|
|
287
|
|
|
|
|
|
|
Generate 3D coordinates using Chemistry::3DBuilder. |
|
288
|
|
|
|
|
|
|
|
|
289
|
|
|
|
|
|
|
=item aromatize |
|
290
|
|
|
|
|
|
|
|
|
291
|
|
|
|
|
|
|
"Aromatize" each molecule as it is read. This is needed for example for |
|
292
|
|
|
|
|
|
|
matching SMARTS patterns that use aromaticity or ring primitives. |
|
293
|
|
|
|
|
|
|
|
|
294
|
|
|
|
|
|
|
=item delete_dummies |
|
295
|
|
|
|
|
|
|
|
|
296
|
|
|
|
|
|
|
Delete dummy atoms after reading each molecule. A dummy atom is defined as an |
|
297
|
|
|
|
|
|
|
atom with an unknown symbol (i.e., it doesn't appear on the periodic table), or |
|
298
|
|
|
|
|
|
|
an atomic number of zero. |
|
299
|
|
|
|
|
|
|
|
|
300
|
|
|
|
|
|
|
=item find_bonds |
|
301
|
|
|
|
|
|
|
|
|
302
|
|
|
|
|
|
|
If set to a true value, find bonds. Use it when reading files with no bond |
|
303
|
|
|
|
|
|
|
information but 3D coordinates to detect the bonds if needed (for example, if |
|
304
|
|
|
|
|
|
|
you want to do match a pattern that includes bonds). If the file has explicit |
|
305
|
|
|
|
|
|
|
bonds, mok will not try to find the bonds, but it will reassign the bond orders |
|
306
|
|
|
|
|
|
|
from scratch. |
|
307
|
|
|
|
|
|
|
|
|
308
|
|
|
|
|
|
|
=item format |
|
309
|
|
|
|
|
|
|
|
|
310
|
|
|
|
|
|
|
The format used when calling $mol_class->read. If not given, $mol_class->read |
|
311
|
|
|
|
|
|
|
tries to identify the format automatically. |
|
312
|
|
|
|
|
|
|
|
|
313
|
|
|
|
|
|
|
=item mol_class |
|
314
|
|
|
|
|
|
|
|
|
315
|
|
|
|
|
|
|
The molecule class used for reading the files. Defaults to Chemistry::Mol. |
|
316
|
|
|
|
|
|
|
|
|
317
|
|
|
|
|
|
|
=back |
|
318
|
|
|
|
|
|
|
|
|
319
|
|
|
|
|
|
|
=cut |
|
320
|
|
|
|
|
|
|
|
|
321
|
|
|
|
|
|
|
sub run { |
|
322
|
|
|
|
|
|
|
my ($self, $opt, @args) = @_; |
|
323
|
|
|
|
|
|
|
# MAIN LOOP |
|
324
|
|
|
|
|
|
|
my $mol_class = $opt->{mol_class} || "Chemistry::Mol"; |
|
325
|
|
|
|
|
|
|
FILE: for my $file (@args) { |
|
326
|
|
|
|
|
|
|
#my (@mols) = $mol_class->read( |
|
327
|
|
|
|
|
|
|
my %reader_opts = ( |
|
328
|
|
|
|
|
|
|
format => $opt->{format}, |
|
329
|
|
|
|
|
|
|
mol_class => $opt->{mol_class}, |
|
330
|
|
|
|
|
|
|
); |
|
331
|
|
|
|
|
|
|
my $reader = $mol_class->file( |
|
332
|
|
|
|
|
|
|
$file, |
|
333
|
|
|
|
|
|
|
%reader_opts, |
|
334
|
|
|
|
|
|
|
); |
|
335
|
|
|
|
|
|
|
$reader->open('<'); |
|
336
|
|
|
|
|
|
|
$reader->read_header; |
|
337
|
|
|
|
|
|
|
while (my @mols = $reader->read_mol($reader->fh, %reader_opts)) { |
|
338
|
|
|
|
|
|
|
MOL: for my $mol (@mols) { |
|
339
|
|
|
|
|
|
|
if ($opt->{delete_dummies}) { |
|
340
|
|
|
|
|
|
|
$_->delete for grep { ! $_->Z } $mol->atoms; |
|
341
|
|
|
|
|
|
|
} |
|
342
|
|
|
|
|
|
|
if ($opt->{find_bonds}) { |
|
343
|
|
|
|
|
|
|
find_bonds($mol) unless $mol->bonds; |
|
344
|
|
|
|
|
|
|
assign_bond_orders($mol); |
|
345
|
|
|
|
|
|
|
} |
|
346
|
|
|
|
|
|
|
if ($opt->{aromatize}) { |
|
347
|
|
|
|
|
|
|
aromatize_mol($mol); |
|
348
|
|
|
|
|
|
|
} |
|
349
|
|
|
|
|
|
|
if ($opt->{build_3d}) { |
|
350
|
|
|
|
|
|
|
build_3d($mol); |
|
351
|
|
|
|
|
|
|
} |
|
352
|
|
|
|
|
|
|
BLOCK: for my $block (@{$self->{blocks}}) { |
|
353
|
|
|
|
|
|
|
my ($code_block, $patt, $patt_str) = |
|
354
|
|
|
|
|
|
|
@{$block}{qw(sub patt patt_str)}; |
|
355
|
|
|
|
|
|
|
if ($patt) { |
|
356
|
|
|
|
|
|
|
MATCH: while ($patt->match($mol)) { |
|
357
|
|
|
|
|
|
|
$code_block->($mol, $file, $patt, |
|
358
|
|
|
|
|
|
|
$patt_str, $reader->fh); |
|
359
|
|
|
|
|
|
|
last unless $patt->attr('global'); |
|
360
|
|
|
|
|
|
|
} |
|
361
|
|
|
|
|
|
|
} else { |
|
362
|
|
|
|
|
|
|
$code_block->($mol, $file, $patt, |
|
363
|
|
|
|
|
|
|
$patt_str, $reader->fh); |
|
364
|
|
|
|
|
|
|
} |
|
365
|
|
|
|
|
|
|
} |
|
366
|
|
|
|
|
|
|
} |
|
367
|
|
|
|
|
|
|
} |
|
368
|
|
|
|
|
|
|
} |
|
369
|
|
|
|
|
|
|
} |
|
370
|
|
|
|
|
|
|
|
|
371
|
|
|
|
|
|
|
1; |
|
372
|
|
|
|
|
|
|
|
|
373
|
|
|
|
|
|
|
__END__ |