line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package Bio::RNA::Barriers::Minimum; |
2
|
|
|
|
|
|
|
our $VERSION = '0.01'; |
3
|
|
|
|
|
|
|
|
4
|
11
|
|
|
11
|
|
206
|
use 5.012; |
|
11
|
|
|
|
|
39
|
|
5
|
11
|
|
|
11
|
|
101
|
use strict; |
|
11
|
|
|
|
|
44
|
|
|
11
|
|
|
|
|
315
|
|
6
|
11
|
|
|
11
|
|
71
|
use warnings; |
|
11
|
|
|
|
|
21
|
|
|
11
|
|
|
|
|
437
|
|
7
|
|
|
|
|
|
|
|
8
|
11
|
|
|
11
|
|
6437
|
use Moose; |
|
11
|
|
|
|
|
5498797
|
|
|
11
|
|
|
|
|
82
|
|
9
|
11
|
|
|
11
|
|
92018
|
use MooseX::StrictConstructor; |
|
11
|
|
|
|
|
369173
|
|
|
11
|
|
|
|
|
49
|
|
10
|
11
|
|
|
11
|
|
113233
|
use Moose::Util::TypeConstraints; |
|
11
|
|
|
|
|
33
|
|
|
11
|
|
|
|
|
110
|
|
11
|
11
|
|
|
11
|
|
27124
|
use namespace::autoclean; |
|
11
|
|
|
|
|
31
|
|
|
11
|
|
|
|
|
63
|
|
12
|
|
|
|
|
|
|
|
13
|
11
|
|
|
11
|
|
7665
|
use autodie qw(:all); |
|
11
|
|
|
|
|
165141
|
|
|
11
|
|
|
|
|
71
|
|
14
|
11
|
|
|
11
|
|
219559
|
use overload q{""} => 'stringify'; |
|
11
|
|
|
|
|
31
|
|
|
11
|
|
|
|
|
67
|
|
15
|
|
|
|
|
|
|
|
16
|
11
|
|
|
11
|
|
778
|
use Scalar::Util qw(blessed); |
|
11
|
|
|
|
|
24
|
|
|
11
|
|
|
|
|
632
|
|
17
|
11
|
|
|
11
|
|
72
|
use List::Util qw(max); |
|
11
|
|
|
|
|
25
|
|
|
11
|
|
|
|
|
567
|
|
18
|
11
|
|
|
11
|
|
7555
|
use List::MoreUtils qw(zip); |
|
11
|
|
|
|
|
153723
|
|
|
11
|
|
|
|
|
81
|
|
19
|
|
|
|
|
|
|
|
20
|
|
|
|
|
|
|
#### Special types for attribute checking. |
21
|
|
|
|
|
|
|
subtype 'RNAStruct' => ( |
22
|
|
|
|
|
|
|
as 'Str', |
23
|
|
|
|
|
|
|
where { m{ ^ [(.)]+ $ }x }, |
24
|
|
|
|
|
|
|
message { |
25
|
|
|
|
|
|
|
"Only '(', ')', and '.' allowed in structure string, found '$_'" |
26
|
|
|
|
|
|
|
}, |
27
|
|
|
|
|
|
|
); |
28
|
|
|
|
|
|
|
|
29
|
|
|
|
|
|
|
subtype 'DisconSaddle' => ( |
30
|
|
|
|
|
|
|
as 'Str', |
31
|
|
|
|
|
|
|
where { m{ ^ ~+ $ }x }, |
32
|
|
|
|
|
|
|
message { |
33
|
|
|
|
|
|
|
"Only '~' allowed in disconnected saddle string, found '$_'" |
34
|
|
|
|
|
|
|
}, |
35
|
|
|
|
|
|
|
); |
36
|
|
|
|
|
|
|
|
37
|
|
|
|
|
|
|
# index - index of basins ordered by energy; 1 is lowest |
38
|
|
|
|
|
|
|
# struct - struct of lowest energy in minimums |
39
|
|
|
|
|
|
|
# mfe - free energy of the basin's local minimum |
40
|
|
|
|
|
|
|
# father_index - index of father basin (the basin this one is merged to) |
41
|
|
|
|
|
|
|
# barrier_height - height of energy barrier (in kcal/mol) to minimum this |
42
|
|
|
|
|
|
|
# one is merged to (relative to this minimum) |
43
|
|
|
|
|
|
|
my @default_attribs = qw( index struct mfe father_index barrier_height); |
44
|
|
|
|
|
|
|
my @default_attrib_args = (is => 'rw', required => 1); |
45
|
|
|
|
|
|
|
my %default_attrib_isa |
46
|
|
|
|
|
|
|
= &zip(\@default_attribs, [qw(Int RNAStruct Num Int Num)]); |
47
|
|
|
|
|
|
|
has $_ => (@default_attrib_args, isa => $default_attrib_isa{$_}) |
48
|
|
|
|
|
|
|
foreach @default_attribs; |
49
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
# Return true iff this is the mfe basin 1. |
51
|
|
|
|
|
|
|
sub is_global_min { |
52
|
0
|
|
|
0
|
1
|
0
|
my $self = shift; |
53
|
0
|
|
|
|
|
0
|
my $is_global_min = $self->index == 1; |
54
|
0
|
|
|
|
|
0
|
return $is_global_min; |
55
|
|
|
|
|
|
|
} |
56
|
|
|
|
|
|
|
|
57
|
|
|
|
|
|
|
# Optional attributes generated by Barriers options --bsize and --saddle. |
58
|
|
|
|
|
|
|
# Descriptions in quotes are from Barriers tutorial at |
59
|
|
|
|
|
|
|
# https://www.tbi.univie.ac.at/RNA/tutorial/#sec4_2 |
60
|
|
|
|
|
|
|
# merged_struct_count - 'numbers of structures in the basin we merge with' |
61
|
|
|
|
|
|
|
# Given is the number of structures in the *current* basin |
62
|
|
|
|
|
|
|
# (including merged ones) *at the time of merging*. For minimum 1, |
63
|
|
|
|
|
|
|
# this is close to the total number of input structures (except for |
64
|
|
|
|
|
|
|
# disconnected structures and other missing ones (???). |
65
|
|
|
|
|
|
|
# father_struct_count - 'number of basin which we merge to' |
66
|
|
|
|
|
|
|
# Actually, it's the number of *structures* in the basin that we |
67
|
|
|
|
|
|
|
# merge to (father basin) *at the time of merging*. |
68
|
|
|
|
|
|
|
# merged_basin_energy - 'free energy of the basin' |
69
|
|
|
|
|
|
|
# This seems to be the free energy of (the partition function of) |
70
|
|
|
|
|
|
|
# the basin---including all merged basins---at the time this basin |
71
|
|
|
|
|
|
|
# is merged. For minimum 1, this corresponds to the ensemble free |
72
|
|
|
|
|
|
|
# energy as far as it was enumerated by RNAsubopt (excluding |
73
|
|
|
|
|
|
|
# disconnected structures). |
74
|
|
|
|
|
|
|
# grad_struct_count - 'number of structures in this basin using gradient walk' |
75
|
|
|
|
|
|
|
# This seems to be the actual number of structures only in this |
76
|
|
|
|
|
|
|
# basin, excluding merged basins. What about --minh merging? Why |
77
|
|
|
|
|
|
|
# doesn't this column sum up to exactly to the total number of |
78
|
|
|
|
|
|
|
# structs if --max==Inf (some are missing)? Issues due to degenerate |
79
|
|
|
|
|
|
|
# energies? |
80
|
|
|
|
|
|
|
# grad_basin_energy - 'gradient basin (consisting of all structures where |
81
|
|
|
|
|
|
|
# gradientwalk ends in the minimum)' |
82
|
|
|
|
|
|
|
# This seems to be free energy of the basin without any merged |
83
|
|
|
|
|
|
|
# basins. Summing up the partition functions corresponding to these |
84
|
|
|
|
|
|
|
# energies, one obtains a free energy almost equal to the ensemble |
85
|
|
|
|
|
|
|
# energy (up to rounding errors due to 6 digit precision). |
86
|
|
|
|
|
|
|
my @bsize_attributes = qw( |
87
|
|
|
|
|
|
|
merged_struct_count father_struct_count merged_basin_energy |
88
|
|
|
|
|
|
|
grad_struct_count grad_basin_energy |
89
|
|
|
|
|
|
|
); |
90
|
|
|
|
|
|
|
my @opt_attributes = (@bsize_attributes, qw(saddle_struct)); |
91
|
|
|
|
|
|
|
# Define a bsize predicate only for the first bsize attribute. Ensure in |
92
|
|
|
|
|
|
|
# BUILD that either all or none of the attributes are set. |
93
|
|
|
|
|
|
|
my @common_attrib_args = ( |
94
|
|
|
|
|
|
|
is => 'ro', |
95
|
|
|
|
|
|
|
lazy => 1, |
96
|
|
|
|
|
|
|
default => sub { confess 'attribute undefined, did you use --bsize/--saddle?' }, |
97
|
|
|
|
|
|
|
); |
98
|
|
|
|
|
|
|
# has $bsize_attributes[0] => (is => 'ro', predicate => 'has_bsize' ); |
99
|
|
|
|
|
|
|
# has $_ => (is => 'ro') foreach @bsize_attributes[1..$#bsize_attributes]; |
100
|
|
|
|
|
|
|
# has 'saddle_struct' => (is => 'ro', predicate => 'has_saddle_struct'); |
101
|
|
|
|
|
|
|
has $bsize_attributes[0] => ( |
102
|
|
|
|
|
|
|
@common_attrib_args, |
103
|
|
|
|
|
|
|
isa => 'Num', |
104
|
|
|
|
|
|
|
predicate => 'has_bsize', |
105
|
|
|
|
|
|
|
writer => "_$bsize_attributes[0]", # private writer |
106
|
|
|
|
|
|
|
); |
107
|
|
|
|
|
|
|
has $_ => (@common_attrib_args, writer => "_$_") # private writer |
108
|
|
|
|
|
|
|
foreach @bsize_attributes[1..$#bsize_attributes]; |
109
|
|
|
|
|
|
|
has 'saddle_struct' => ( |
110
|
|
|
|
|
|
|
@common_attrib_args, |
111
|
|
|
|
|
|
|
isa => 'RNAStruct | DisconSaddle', |
112
|
|
|
|
|
|
|
predicate => 'has_saddle_struct', |
113
|
|
|
|
|
|
|
); |
114
|
|
|
|
|
|
|
|
115
|
|
|
|
|
|
|
# Optional reference to the father minimum. |
116
|
|
|
|
|
|
|
has 'father' => ( |
117
|
|
|
|
|
|
|
is => 'rw', |
118
|
|
|
|
|
|
|
trigger => \&_check_father, |
119
|
|
|
|
|
|
|
# Use name 'has_father_REF' because has_father==false reads as if the |
120
|
|
|
|
|
|
|
# min does not have a father at all. |
121
|
|
|
|
|
|
|
# We don't need this, we always have it if we have a father. |
122
|
|
|
|
|
|
|
# predicate => 'has_father_ref', |
123
|
|
|
|
|
|
|
); |
124
|
|
|
|
|
|
|
|
125
|
|
|
|
|
|
|
sub _check_father { |
126
|
514
|
|
|
514
|
|
965
|
my ($self, $father) = @_; |
127
|
514
|
50
|
33
|
|
|
3045
|
confess 'Need a reference to another minimum to set father attribute' |
128
|
|
|
|
|
|
|
unless blessed $father and $father->isa( __PACKAGE__ ); |
129
|
514
|
50
|
|
|
|
15664
|
confess "Father's index does not match the index used during construction" |
130
|
|
|
|
|
|
|
unless $self->father_index == $father->index; |
131
|
|
|
|
|
|
|
} |
132
|
|
|
|
|
|
|
|
133
|
|
|
|
|
|
|
# Returns true iff the minimum has a father minimum it has been merged to. |
134
|
|
|
|
|
|
|
sub has_father { |
135
|
551
|
|
|
551
|
1
|
922
|
my $self = shift; |
136
|
551
|
|
|
|
|
16420
|
my $has_father = $self->father_index > 0; |
137
|
551
|
|
|
|
|
1913
|
return $has_father; |
138
|
|
|
|
|
|
|
} |
139
|
|
|
|
|
|
|
|
140
|
|
|
|
|
|
|
|
141
|
|
|
|
|
|
|
# Minimum is connected to basin 1 (mfe). |
142
|
|
|
|
|
|
|
has 'is_connected' => ( |
143
|
|
|
|
|
|
|
is => 'ro', |
144
|
|
|
|
|
|
|
lazy => 1, |
145
|
|
|
|
|
|
|
init_arg => undef, # cannot be set manually |
146
|
|
|
|
|
|
|
builder => '_build_is_connected', |
147
|
|
|
|
|
|
|
); |
148
|
|
|
|
|
|
|
|
149
|
|
|
|
|
|
|
sub _build_is_connected { |
150
|
12
|
|
|
12
|
|
21
|
my $self = shift; |
151
|
|
|
|
|
|
|
|
152
|
12
|
100
|
|
|
|
350
|
return 1 if $self->index == 1; # this is the mfe basin |
153
|
11
|
100
|
|
|
|
116
|
return 0 unless $self->has_father; # basin has no father |
154
|
|
|
|
|
|
|
|
155
|
|
|
|
|
|
|
# confess 'Reference to father minimum has not been set, cannot proceed.' |
156
|
|
|
|
|
|
|
# unless $self->has_father_ref; |
157
|
|
|
|
|
|
|
|
158
|
10
|
|
|
|
|
289
|
my $is_connected = $self->father->is_connected; |
159
|
10
|
|
|
|
|
302
|
return $is_connected; |
160
|
|
|
|
|
|
|
} |
161
|
|
|
|
|
|
|
|
162
|
|
|
|
|
|
|
# Parse passed line read from barriers file. |
163
|
|
|
|
|
|
|
around BUILDARGS => sub { |
164
|
|
|
|
|
|
|
my $orig = shift; |
165
|
|
|
|
|
|
|
my $class = shift; |
166
|
|
|
|
|
|
|
|
167
|
|
|
|
|
|
|
my @args; # as passed to the constructor |
168
|
|
|
|
|
|
|
if ( @_ == 1 && !ref $_[0] ) { # process line from bar file |
169
|
|
|
|
|
|
|
my $input_line = shift; |
170
|
|
|
|
|
|
|
my @fields = split /\s+/, $input_line; |
171
|
|
|
|
|
|
|
shift @fields if $fields[0] eq q{}; # drop empty first field |
172
|
|
|
|
|
|
|
|
173
|
|
|
|
|
|
|
if (@fields < @default_attribs) { |
174
|
|
|
|
|
|
|
confess "Input line has not enough fields: $input_line"; |
175
|
|
|
|
|
|
|
} |
176
|
|
|
|
|
|
|
|
177
|
|
|
|
|
|
|
# Add default args |
178
|
|
|
|
|
|
|
push @args, $_ => shift @fields foreach @default_attribs; |
179
|
|
|
|
|
|
|
# @args = map { $_ => shift @fields } @attributes; |
180
|
|
|
|
|
|
|
|
181
|
|
|
|
|
|
|
# Add saddle struct if present |
182
|
|
|
|
|
|
|
if (@fields == 1 or @fields == @opt_attributes) { |
183
|
|
|
|
|
|
|
push @args, saddle_struct => shift @fields; |
184
|
|
|
|
|
|
|
} |
185
|
|
|
|
|
|
|
|
186
|
|
|
|
|
|
|
# Add bsize attributes if present |
187
|
|
|
|
|
|
|
if (@fields == @bsize_attributes) { |
188
|
|
|
|
|
|
|
push @args, $_ => shift @fields foreach @bsize_attributes; |
189
|
|
|
|
|
|
|
} |
190
|
|
|
|
|
|
|
|
191
|
|
|
|
|
|
|
confess "Unrecognized number of fields on input line:\n$input_line" |
192
|
|
|
|
|
|
|
unless @fields == 0; # all fields used up? |
193
|
|
|
|
|
|
|
} |
194
|
|
|
|
|
|
|
else { |
195
|
|
|
|
|
|
|
@args = @_; |
196
|
|
|
|
|
|
|
} |
197
|
|
|
|
|
|
|
return $class->$orig(@args); |
198
|
|
|
|
|
|
|
}; |
199
|
|
|
|
|
|
|
|
200
|
|
|
|
|
|
|
sub BUILD { |
201
|
563
|
|
|
563
|
0
|
1012
|
my $self = shift; |
202
|
|
|
|
|
|
|
|
203
|
|
|
|
|
|
|
# Ensure presence or absence of all bsize attributes |
204
|
563
|
|
|
|
|
1107
|
my $defined_count = grep {defined $self->{$_}} @bsize_attributes; |
|
2815
|
|
|
|
|
6141
|
|
205
|
563
|
50
|
66
|
|
|
17575
|
confess "Need to define all or none of the --bsize attributes ", |
206
|
|
|
|
|
|
|
join q{, }, @bsize_attributes |
207
|
|
|
|
|
|
|
unless $defined_count == 0 or $defined_count == @bsize_attributes; |
208
|
|
|
|
|
|
|
} |
209
|
|
|
|
|
|
|
|
210
|
|
|
|
|
|
|
# Determine all ancestor minima of this minimum, i.e. this minimum's |
211
|
|
|
|
|
|
|
# father, grand father, grand grand father etc. in this order. |
212
|
|
|
|
|
|
|
# Returns list of all ancestors (may be empty if min is disconnected). |
213
|
|
|
|
|
|
|
sub ancestors { |
214
|
0
|
|
|
0
|
1
|
0
|
my ($self) = @_; |
215
|
|
|
|
|
|
|
|
216
|
0
|
|
|
|
|
0
|
my $ancestor = $self; |
217
|
0
|
|
|
|
|
0
|
my @ancestors; |
218
|
0
|
|
|
|
|
0
|
while ($ancestor->has_father) { |
219
|
|
|
|
|
|
|
# confess 'Need father reference to determine ancestors' |
220
|
|
|
|
|
|
|
# unless $ancestor->has_father_ref; |
221
|
0
|
|
|
|
|
0
|
push @ancestors, $ancestor->father; |
222
|
0
|
|
|
|
|
0
|
$ancestor = $ancestor->father; |
223
|
|
|
|
|
|
|
} |
224
|
|
|
|
|
|
|
|
225
|
0
|
|
|
|
|
0
|
return @ancestors; |
226
|
|
|
|
|
|
|
} |
227
|
|
|
|
|
|
|
|
228
|
|
|
|
|
|
|
# Stringify minimum to equal an entry line in the barriers output file. |
229
|
|
|
|
|
|
|
# Format strings are taken from Barriers' C source code. |
230
|
|
|
|
|
|
|
sub stringify { |
231
|
528
|
|
|
528
|
1
|
959
|
my $self = shift; |
232
|
|
|
|
|
|
|
|
233
|
|
|
|
|
|
|
# Default attributes |
234
|
528
|
|
|
|
|
999
|
my $min_string = $self->brief; |
235
|
|
|
|
|
|
|
|
236
|
|
|
|
|
|
|
# Add saddle struct if defined. |
237
|
528
|
100
|
|
|
|
20164
|
if ($self->has_saddle_struct) { |
238
|
264
|
|
|
|
|
7913
|
$min_string .= q{ } . $self->saddle_struct; |
239
|
|
|
|
|
|
|
} |
240
|
|
|
|
|
|
|
|
241
|
|
|
|
|
|
|
# Add bsize attributes if defined. |
242
|
528
|
100
|
|
|
|
18493
|
if ($self->has_bsize) { |
243
|
|
|
|
|
|
|
$min_string .= sprintf " %12ld %8ld %10.6f %8ld %10.6f", |
244
|
264
|
|
|
|
|
528
|
map {$self->{$_}} @bsize_attributes; |
|
1320
|
|
|
|
|
5166
|
|
245
|
|
|
|
|
|
|
} |
246
|
|
|
|
|
|
|
|
247
|
528
|
|
|
|
|
2955
|
return $min_string; |
248
|
|
|
|
|
|
|
} |
249
|
|
|
|
|
|
|
|
250
|
|
|
|
|
|
|
# Stringification method returning a more brief representation of the |
251
|
|
|
|
|
|
|
# minimum containing only the index, min struct, its energy, the father's |
252
|
|
|
|
|
|
|
# index, and the barrier height. This equals the output of Barriers if |
253
|
|
|
|
|
|
|
# neither --bsize nor --saddle is given. |
254
|
|
|
|
|
|
|
sub brief { |
255
|
528
|
|
|
528
|
1
|
753
|
my $self = shift; |
256
|
|
|
|
|
|
|
|
257
|
|
|
|
|
|
|
# Default attributes |
258
|
|
|
|
|
|
|
my $brief_string = sprintf "%4d %s %6.2f %4d %6.2f", |
259
|
528
|
|
|
|
|
934
|
map {$self->{$_}} @default_attribs; |
|
2640
|
|
|
|
|
11009
|
|
260
|
|
|
|
|
|
|
|
261
|
528
|
|
|
|
|
1940
|
return $brief_string; |
262
|
|
|
|
|
|
|
} |
263
|
|
|
|
|
|
|
|
264
|
|
|
|
|
|
|
# ABSOLUTE energy of the lowest structure connecting this basin to another |
265
|
|
|
|
|
|
|
# one. The barrier height, in contrast, is the RELATIVE energy of the same |
266
|
|
|
|
|
|
|
# structure w.r.t. to the basin's (local) mfe. |
267
|
|
|
|
|
|
|
# BEWARE: if the basin does not have a father (father == 0), then the |
268
|
|
|
|
|
|
|
# barrier height is (as reported by Barriers) given with respect to the global exploration |
269
|
|
|
|
|
|
|
# threshold. |
270
|
|
|
|
|
|
|
# Since this gives unexpected results, the saddle height is set to the |
271
|
|
|
|
|
|
|
# global mfe for basin 1, and to Inf for disconnected basins. |
272
|
|
|
|
|
|
|
sub saddle_height { |
273
|
0
|
|
|
0
|
1
|
|
my $self = shift; |
274
|
|
|
|
|
|
|
|
275
|
|
|
|
|
|
|
# Mfe basin is connected to itself with a barrier of 0. Other |
276
|
|
|
|
|
|
|
# fatherless basins are disconnected and thus have an unknown saddle |
277
|
|
|
|
|
|
|
# height -- set to Inf. |
278
|
0
|
0
|
|
|
|
|
my $barrier_height = $self->has_father ? $self->barrier_height |
|
|
0
|
|
|
|
|
|
279
|
|
|
|
|
|
|
: $self->is_global_min ? 0 |
280
|
|
|
|
|
|
|
: 'Inf' |
281
|
|
|
|
|
|
|
; |
282
|
|
|
|
|
|
|
|
283
|
|
|
|
|
|
|
# Energy values from Bar file have only 2 digits precision. |
284
|
0
|
|
|
|
|
|
my $saddle_height = sprintf "%.2f", $self->mfe + $barrier_height; |
285
|
0
|
|
|
|
|
|
return $saddle_height; |
286
|
|
|
|
|
|
|
} |
287
|
|
|
|
|
|
|
|
288
|
|
|
|
|
|
|
# Saddle height as described for saddle_height(), but with respect to the |
289
|
|
|
|
|
|
|
# global mfe structure (basin 1). |
290
|
|
|
|
|
|
|
sub global_saddle_height { |
291
|
0
|
|
|
0
|
1
|
|
my $self = shift; |
292
|
|
|
|
|
|
|
|
293
|
|
|
|
|
|
|
# Move up in barrier tree until reachin basin 1 or realizing we are |
294
|
|
|
|
|
|
|
# disconnected. Global saddle height is maximal encountered height. |
295
|
0
|
|
|
|
|
|
my $ancestor = $self; |
296
|
0
|
|
|
|
|
|
my $glob_sadd_height = $self->saddle_height; |
297
|
0
|
|
|
|
|
|
while ($ancestor->father_index > 1) { |
298
|
0
|
|
|
|
|
|
$ancestor = $ancestor->father; |
299
|
0
|
|
|
|
|
|
$glob_sadd_height |
300
|
|
|
|
|
|
|
= max $glob_sadd_height, $ancestor->saddle_height; |
301
|
|
|
|
|
|
|
} |
302
|
|
|
|
|
|
|
|
303
|
0
|
|
|
|
|
|
return $glob_sadd_height; |
304
|
|
|
|
|
|
|
} |
305
|
|
|
|
|
|
|
|
306
|
|
|
|
|
|
|
__PACKAGE__->meta->make_immutable; |
307
|
|
|
|
|
|
|
|
308
|
|
|
|
|
|
|
1; |
309
|
|
|
|
|
|
|
|
310
|
|
|
|
|
|
|
|
311
|
|
|
|
|
|
|
__END__ |
312
|
|
|
|
|
|
|
|
313
|
|
|
|
|
|
|
=pod |
314
|
|
|
|
|
|
|
|
315
|
|
|
|
|
|
|
=encoding UTF-8 |
316
|
|
|
|
|
|
|
|
317
|
|
|
|
|
|
|
=head1 NAME |
318
|
|
|
|
|
|
|
|
319
|
|
|
|
|
|
|
Bio::RNA::Barriers::Minimum - Store a single local minimum |
320
|
|
|
|
|
|
|
(macrostate) from the output of I<Barriers> |
321
|
|
|
|
|
|
|
|
322
|
|
|
|
|
|
|
=head1 SYNOPSIS |
323
|
|
|
|
|
|
|
|
324
|
|
|
|
|
|
|
use Bio::RNA::Barriers; |
325
|
|
|
|
|
|
|
|
326
|
|
|
|
|
|
|
my $min_string = '...'; # single line from .bar file |
327
|
|
|
|
|
|
|
my $min = Bio::RNA::Barriers::Minimum->new($min_string); |
328
|
|
|
|
|
|
|
# my $min2 = $results->get_min(3) # usually used like this |
329
|
|
|
|
|
|
|
|
330
|
|
|
|
|
|
|
print "$min\n"; # prints minimum as in the results file |
331
|
|
|
|
|
|
|
|
332
|
|
|
|
|
|
|
if ($min->has_bsize and $min->is_connected) |
333
|
|
|
|
|
|
|
print "Minimum contributes an energy of ", $min->grad_basin_energy(), |
334
|
|
|
|
|
|
|
" to the partition function." |
335
|
|
|
|
|
|
|
|
336
|
|
|
|
|
|
|
|
337
|
|
|
|
|
|
|
=head1 DESCRIPTION |
338
|
|
|
|
|
|
|
|
339
|
|
|
|
|
|
|
Objects of this class repesent the individual local minima (macrostates) from |
340
|
|
|
|
|
|
|
the results file of I<Barriers>. The construction is usually done |
341
|
|
|
|
|
|
|
automatically by the results objects (cf. L<Bio::RNA::Barriers::Results>). The |
342
|
|
|
|
|
|
|
methods can be used for various queries. |
343
|
|
|
|
|
|
|
|
344
|
|
|
|
|
|
|
|
345
|
|
|
|
|
|
|
=head1 METHODS |
346
|
|
|
|
|
|
|
|
347
|
|
|
|
|
|
|
=head3 $min->new($results_file_line) |
348
|
|
|
|
|
|
|
|
349
|
|
|
|
|
|
|
Construct a minimum object from a single line of the I<Barriers> results file. |
350
|
|
|
|
|
|
|
|
351
|
|
|
|
|
|
|
=head3 $min->ancestors() |
352
|
|
|
|
|
|
|
|
353
|
|
|
|
|
|
|
Determine all ancestor minima of this minimum, i.e. this minimum's father, |
354
|
|
|
|
|
|
|
grand father, grand grand father etc. in this order. Returns a list of all |
355
|
|
|
|
|
|
|
ancestors (may be empty if min is disconnected). |
356
|
|
|
|
|
|
|
|
357
|
|
|
|
|
|
|
=head3 $min->has_bsize() |
358
|
|
|
|
|
|
|
|
359
|
|
|
|
|
|
|
Boolean. True iff the minimum provides information about the basin size as |
360
|
|
|
|
|
|
|
computed by the I<Barriers> option C<--bsize>. |
361
|
|
|
|
|
|
|
|
362
|
|
|
|
|
|
|
=head3 $min->merged_struct_count() |
363
|
|
|
|
|
|
|
|
364
|
|
|
|
|
|
|
Given is the number of structures in the current basin (including merged ones) |
365
|
|
|
|
|
|
|
B<at the time of merging>. For minimum 1, this is close to the total number of |
366
|
|
|
|
|
|
|
input structures (except for disconnected structures and other missing ones |
367
|
|
|
|
|
|
|
(???)). |
368
|
|
|
|
|
|
|
|
369
|
|
|
|
|
|
|
This attribute is only available if Barriers was used with the C<--bsize> |
370
|
|
|
|
|
|
|
option. Use C<$min-E<gt>has_bsize()> to query this. |
371
|
|
|
|
|
|
|
|
372
|
|
|
|
|
|
|
=head3 $min->father_struct_count() |
373
|
|
|
|
|
|
|
|
374
|
|
|
|
|
|
|
The number of structures in the basin that we merge into (father basin) B<at |
375
|
|
|
|
|
|
|
the time of merging>. |
376
|
|
|
|
|
|
|
|
377
|
|
|
|
|
|
|
This attribute is only available if Barriers was used with the C<--bsize> |
378
|
|
|
|
|
|
|
option. Use C<$min-E<gt>has_bsize()> to query this. |
379
|
|
|
|
|
|
|
|
380
|
|
|
|
|
|
|
=head3 $min->merged_basin_energy() |
381
|
|
|
|
|
|
|
|
382
|
|
|
|
|
|
|
The free energy of (the partition function of) the basin -- including all |
383
|
|
|
|
|
|
|
merged basins -- at the time B<this> basin is merged. For minimum 1, this |
384
|
|
|
|
|
|
|
corresponds to the ensemble's free energy as far as it was enumerated by |
385
|
|
|
|
|
|
|
RNAsubopt (excluding disconnected structures). |
386
|
|
|
|
|
|
|
|
387
|
|
|
|
|
|
|
This attribute is only available if Barriers was used with the C<--bsize> |
388
|
|
|
|
|
|
|
option. Use C<$min-E<gt>has_bsize()> to query this. |
389
|
|
|
|
|
|
|
|
390
|
|
|
|
|
|
|
=head3 $min->grad_struct_count() |
391
|
|
|
|
|
|
|
|
392
|
|
|
|
|
|
|
The number of structures only in this gradient basin, excluding merged basins. |
393
|
|
|
|
|
|
|
|
394
|
|
|
|
|
|
|
Open questions: What about --minh merging? Why doesn't this column sum up to |
395
|
|
|
|
|
|
|
exactly to the total number of structs if --max==Inf (some are missing)? |
396
|
|
|
|
|
|
|
Issues due to degenerate energies? |
397
|
|
|
|
|
|
|
|
398
|
|
|
|
|
|
|
This attribute is only available if Barriers was used with the C<--bsize> |
399
|
|
|
|
|
|
|
option. Use C<$min-E<gt>has_bsize()> to query this. |
400
|
|
|
|
|
|
|
|
401
|
|
|
|
|
|
|
=head3 $min->grad_basin_energy() |
402
|
|
|
|
|
|
|
|
403
|
|
|
|
|
|
|
Free energy of the basin without any merged basins. Summing |
404
|
|
|
|
|
|
|
up the partition functions corresponding to these energies, one obtains a free |
405
|
|
|
|
|
|
|
energy almost equal to the ensemble energy (up to rounding errors due to 6 |
406
|
|
|
|
|
|
|
digit precision, and of course up to the enumeration threshold used for |
407
|
|
|
|
|
|
|
I<RNAsubopt>). |
408
|
|
|
|
|
|
|
|
409
|
|
|
|
|
|
|
This attribute is only available if Barriers was used with the C<--bsize> |
410
|
|
|
|
|
|
|
option. Use C<$min-E<gt>has_bsize()> to query this. |
411
|
|
|
|
|
|
|
|
412
|
|
|
|
|
|
|
=head3 $min->is_global_min() |
413
|
|
|
|
|
|
|
|
414
|
|
|
|
|
|
|
Returns true iff this is the global minimum (i.e. basin 1). |
415
|
|
|
|
|
|
|
|
416
|
|
|
|
|
|
|
=head3 $min->index() |
417
|
|
|
|
|
|
|
|
418
|
|
|
|
|
|
|
1-based index of the minimum (as is the Barriers file). |
419
|
|
|
|
|
|
|
|
420
|
|
|
|
|
|
|
=head3 $min->struct() |
421
|
|
|
|
|
|
|
|
422
|
|
|
|
|
|
|
Returns the dot-bracket structure string of the minimum. |
423
|
|
|
|
|
|
|
|
424
|
|
|
|
|
|
|
=head3 $min->mfe() |
425
|
|
|
|
|
|
|
|
426
|
|
|
|
|
|
|
B<Local> minimum free energy of the basin (i.e. the minimum's energy). |
427
|
|
|
|
|
|
|
|
428
|
|
|
|
|
|
|
=head3 $min->father_index() |
429
|
|
|
|
|
|
|
|
430
|
|
|
|
|
|
|
Returns the index of the father minimum (i.e. the one this minimum has been |
431
|
|
|
|
|
|
|
merged to). |
432
|
|
|
|
|
|
|
|
433
|
|
|
|
|
|
|
=head3 $min->barrier_height() |
434
|
|
|
|
|
|
|
|
435
|
|
|
|
|
|
|
Returns the barrier height (B<relative> energy difference of the saddle point |
436
|
|
|
|
|
|
|
to the local minimum). For the B<absolute> energy of the saddle point, see |
437
|
|
|
|
|
|
|
C<saddle_height()>. |
438
|
|
|
|
|
|
|
|
439
|
|
|
|
|
|
|
=head3 $min->saddle_height() |
440
|
|
|
|
|
|
|
|
441
|
|
|
|
|
|
|
B<Absolute> energy of the lowest structure connecting this basin to another |
442
|
|
|
|
|
|
|
one. The barrier height, in contrast, is the B<relative> energy of the same |
443
|
|
|
|
|
|
|
structure w.r.t. to the basin's (local) mfe. |
444
|
|
|
|
|
|
|
|
445
|
|
|
|
|
|
|
B<Beware>: if the basin does not have a father (father == 0), then the |
446
|
|
|
|
|
|
|
reported saddle height is given with respect to the global exploration |
447
|
|
|
|
|
|
|
threshold. This is strange but consistent with original Barriers files. |
448
|
|
|
|
|
|
|
|
449
|
|
|
|
|
|
|
=head3 $min->global_saddle_height() |
450
|
|
|
|
|
|
|
|
451
|
|
|
|
|
|
|
Saddle height as described for saddle_height(), but not with respect to |
452
|
|
|
|
|
|
|
any neighbor minimum, but to the global mfe structure (basin 1). |
453
|
|
|
|
|
|
|
|
454
|
|
|
|
|
|
|
=head3 $min->saddle_struct() |
455
|
|
|
|
|
|
|
|
456
|
|
|
|
|
|
|
Returns the saddle structure via which it was merged to its father minimum. |
457
|
|
|
|
|
|
|
If this attribute was not set (i.e. I<Barriers> was run without the |
458
|
|
|
|
|
|
|
C<--saddle> option), it croaks when accessed. |
459
|
|
|
|
|
|
|
|
460
|
|
|
|
|
|
|
Use the C<has_saddle()> predicate to query the status of this attribute. |
461
|
|
|
|
|
|
|
|
462
|
|
|
|
|
|
|
=head3 $min->has_saddle_struct() |
463
|
|
|
|
|
|
|
|
464
|
|
|
|
|
|
|
Predicate for the C<saddle> attribute. True iff the minimum provides the |
465
|
|
|
|
|
|
|
saddle structure via which it was merged to its father minimum, as computed by |
466
|
|
|
|
|
|
|
the I<Barriers> option C<--saddle>. It can be queried via the C<saddle_struct> |
467
|
|
|
|
|
|
|
method. |
468
|
|
|
|
|
|
|
|
469
|
|
|
|
|
|
|
=head3 $min->father() |
470
|
|
|
|
|
|
|
|
471
|
|
|
|
|
|
|
Returns (a reference to) the father minimum object. |
472
|
|
|
|
|
|
|
|
473
|
|
|
|
|
|
|
=head3 $min->has_father() |
474
|
|
|
|
|
|
|
|
475
|
|
|
|
|
|
|
Returns true iff the minimum has a father minimum it has been merged to. |
476
|
|
|
|
|
|
|
|
477
|
|
|
|
|
|
|
=head3 $min->is_connected() |
478
|
|
|
|
|
|
|
|
479
|
|
|
|
|
|
|
Boolean. True iff the minimum is connected to basin 1 (the mfe basin). |
480
|
|
|
|
|
|
|
|
481
|
|
|
|
|
|
|
=head3 $min->ancestors() |
482
|
|
|
|
|
|
|
|
483
|
|
|
|
|
|
|
Determine all ancestor minima of this minimum, i.e. this minimum's father, |
484
|
|
|
|
|
|
|
grand father, grand grand father etc. in this order. |
485
|
|
|
|
|
|
|
|
486
|
|
|
|
|
|
|
=head3 $min->stringify() |
487
|
|
|
|
|
|
|
|
488
|
|
|
|
|
|
|
Stringify minimum to equal an entry line in the barriers output file. |
489
|
|
|
|
|
|
|
Format strings are taken from Barriers' C source code. |
490
|
|
|
|
|
|
|
|
491
|
|
|
|
|
|
|
=head3 $min->brief() |
492
|
|
|
|
|
|
|
|
493
|
|
|
|
|
|
|
Stringification method returning a more brief representation of the |
494
|
|
|
|
|
|
|
minimum containing only the index, min struct, its energy, the father's |
495
|
|
|
|
|
|
|
index, and the barrier height. This equals the output of Barriers if |
496
|
|
|
|
|
|
|
neither C<--bsize> nor C<--saddle> is given. |
497
|
|
|
|
|
|
|
|
498
|
|
|
|
|
|
|
|
499
|
|
|
|
|
|
|
=head1 AUTHOR |
500
|
|
|
|
|
|
|
|
501
|
|
|
|
|
|
|
Felix Kuehnl, C<< <felix at bioinf.uni-leipzig.de> >> |
502
|
|
|
|
|
|
|
|
503
|
|
|
|
|
|
|
=head1 BUGS |
504
|
|
|
|
|
|
|
|
505
|
|
|
|
|
|
|
Please report any bugs or feature requests by raising an issue at |
506
|
|
|
|
|
|
|
L<https://github.com/xileF1337/Bio-RNA-Barriers/issues>. |
507
|
|
|
|
|
|
|
|
508
|
|
|
|
|
|
|
You can also do so by mailing to C<bug-bio-rna-barmap at rt.cpan.org>, |
509
|
|
|
|
|
|
|
or through the web interface at |
510
|
|
|
|
|
|
|
L<https://rt.cpan.org/NoAuth/ReportBug.html?Queue=Bio-RNA-BarMap>. I will be |
511
|
|
|
|
|
|
|
notified, and then you'll automatically be notified of progress on your bug as |
512
|
|
|
|
|
|
|
I make changes. |
513
|
|
|
|
|
|
|
|
514
|
|
|
|
|
|
|
|
515
|
|
|
|
|
|
|
=head1 SUPPORT |
516
|
|
|
|
|
|
|
|
517
|
|
|
|
|
|
|
You can find documentation for this module with the perldoc command. |
518
|
|
|
|
|
|
|
|
519
|
|
|
|
|
|
|
perldoc Bio::RNA::Barriers |
520
|
|
|
|
|
|
|
|
521
|
|
|
|
|
|
|
|
522
|
|
|
|
|
|
|
You can also look for information at the official Barriers website: |
523
|
|
|
|
|
|
|
|
524
|
|
|
|
|
|
|
L<https://www.tbi.univie.ac.at/RNA/Barriers/> |
525
|
|
|
|
|
|
|
|
526
|
|
|
|
|
|
|
|
527
|
|
|
|
|
|
|
=over 4 |
528
|
|
|
|
|
|
|
|
529
|
|
|
|
|
|
|
=item * Github: the official repository |
530
|
|
|
|
|
|
|
|
531
|
|
|
|
|
|
|
L<https://github.com/xileF1337/Bio-RNA-Barriers> |
532
|
|
|
|
|
|
|
|
533
|
|
|
|
|
|
|
|
534
|
|
|
|
|
|
|
=item * RT: CPAN's request tracker (report bugs here) |
535
|
|
|
|
|
|
|
|
536
|
|
|
|
|
|
|
L<https://rt.cpan.org/NoAuth/Bugs.html?Dist=Bio-RNA-Barriers> |
537
|
|
|
|
|
|
|
|
538
|
|
|
|
|
|
|
=item * AnnoCPAN: Annotated CPAN documentation |
539
|
|
|
|
|
|
|
|
540
|
|
|
|
|
|
|
L<http://annocpan.org/dist/Bio-RNA-Barriers> |
541
|
|
|
|
|
|
|
|
542
|
|
|
|
|
|
|
=item * CPAN Ratings |
543
|
|
|
|
|
|
|
|
544
|
|
|
|
|
|
|
L<https://cpanratings.perl.org/d/Bio-RNA-Barriers> |
545
|
|
|
|
|
|
|
|
546
|
|
|
|
|
|
|
=item * Search CPAN |
547
|
|
|
|
|
|
|
|
548
|
|
|
|
|
|
|
L<https://metacpan.org/release/Bio-RNA-Barriers> |
549
|
|
|
|
|
|
|
|
550
|
|
|
|
|
|
|
=back |
551
|
|
|
|
|
|
|
|
552
|
|
|
|
|
|
|
|
553
|
|
|
|
|
|
|
=head1 LICENSE AND COPYRIGHT |
554
|
|
|
|
|
|
|
|
555
|
|
|
|
|
|
|
Copyright 2019-2021 Felix Kuehnl. |
556
|
|
|
|
|
|
|
|
557
|
|
|
|
|
|
|
This program is free software: you can redistribute it and/or modify |
558
|
|
|
|
|
|
|
it under the terms of the GNU General Public License as published by |
559
|
|
|
|
|
|
|
the Free Software Foundation, either version 3 of the License, or |
560
|
|
|
|
|
|
|
(at your option) any later version. |
561
|
|
|
|
|
|
|
|
562
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful, |
563
|
|
|
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of |
564
|
|
|
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
565
|
|
|
|
|
|
|
GNU General Public License for more details. |
566
|
|
|
|
|
|
|
|
567
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License |
568
|
|
|
|
|
|
|
along with this program. If not, see L<http://www.gnu.org/licenses/>. |
569
|
|
|
|
|
|
|
|
570
|
|
|
|
|
|
|
|
571
|
|
|
|
|
|
|
=cut |
572
|
|
|
|
|
|
|
|
573
|
|
|
|
|
|
|
|
574
|
|
|
|
|
|
|
# End of Bio::RNA::Barriers::Minimum |