line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
# Bio::Tools::Alignment::Trim.pm |
2
|
|
|
|
|
|
|
# |
3
|
|
|
|
|
|
|
# Please direct questions and support issues to |
4
|
|
|
|
|
|
|
# |
5
|
|
|
|
|
|
|
# Cared for by Chad Matsalla |
6
|
|
|
|
|
|
|
# |
7
|
|
|
|
|
|
|
# Copyright Chad Matsalla |
8
|
|
|
|
|
|
|
# |
9
|
|
|
|
|
|
|
# You may distribute this module under the same terms as perl itself |
10
|
|
|
|
|
|
|
|
11
|
|
|
|
|
|
|
# POD documentation - main docs before the code |
12
|
|
|
|
|
|
|
|
13
|
|
|
|
|
|
|
=head1 NAME |
14
|
|
|
|
|
|
|
|
15
|
|
|
|
|
|
|
Bio::Tools::Alignment::Trim - A kludge to do specialized trimming of |
16
|
|
|
|
|
|
|
sequence based on quality. |
17
|
|
|
|
|
|
|
|
18
|
|
|
|
|
|
|
=head1 SYNOPSIS |
19
|
|
|
|
|
|
|
|
20
|
|
|
|
|
|
|
use Bio::Tools::Alignment::Trim; |
21
|
|
|
|
|
|
|
$o_trim = Bio::Tools::Alignment::Trim->new(); |
22
|
|
|
|
|
|
|
$o_trim->set_reverse_designator("R"); |
23
|
|
|
|
|
|
|
$o_trim->set_forward_designator("F"); |
24
|
|
|
|
|
|
|
|
25
|
|
|
|
|
|
|
|
26
|
|
|
|
|
|
|
=head1 DESCRIPTION |
27
|
|
|
|
|
|
|
|
28
|
|
|
|
|
|
|
This is a specialized module designed by Chad for Chad to trim sequences |
29
|
|
|
|
|
|
|
based on a highly specialized list of requirements. In other words, write |
30
|
|
|
|
|
|
|
something that will trim sequences 'just like the people in the lab would |
31
|
|
|
|
|
|
|
do manually'. |
32
|
|
|
|
|
|
|
|
33
|
|
|
|
|
|
|
I settled on a sliding-window-average style of search which is ugly and |
34
|
|
|
|
|
|
|
slow but does _exactly_ what I want it to do. |
35
|
|
|
|
|
|
|
|
36
|
|
|
|
|
|
|
Mental note: rewrite this. |
37
|
|
|
|
|
|
|
|
38
|
|
|
|
|
|
|
It is very important to keep in mind the context in which this module was |
39
|
|
|
|
|
|
|
written: strictly to support the projects for which Consed.pm was |
40
|
|
|
|
|
|
|
designed. |
41
|
|
|
|
|
|
|
|
42
|
|
|
|
|
|
|
=head1 FEEDBACK |
43
|
|
|
|
|
|
|
|
44
|
|
|
|
|
|
|
=head2 Mailing Lists |
45
|
|
|
|
|
|
|
|
46
|
|
|
|
|
|
|
User feedback is an integral part of the evolution of this and other |
47
|
|
|
|
|
|
|
Bioperl modules. Send your comments and suggestions preferably to one |
48
|
|
|
|
|
|
|
of the Bioperl mailing lists. Your participation is much appreciated. |
49
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
bioperl-l@bioperl.org - General discussion |
51
|
|
|
|
|
|
|
http://bioperl.org/wiki/Mailing_lists - About the mailing |
52
|
|
|
|
|
|
|
lists |
53
|
|
|
|
|
|
|
|
54
|
|
|
|
|
|
|
=head2 Support |
55
|
|
|
|
|
|
|
|
56
|
|
|
|
|
|
|
Please direct usage questions or support issues to the mailing list: |
57
|
|
|
|
|
|
|
|
58
|
|
|
|
|
|
|
I |
59
|
|
|
|
|
|
|
|
60
|
|
|
|
|
|
|
rather than to the module maintainer directly. Many experienced and |
61
|
|
|
|
|
|
|
reponsive experts will be able look at the problem and quickly |
62
|
|
|
|
|
|
|
address it. Please include a thorough description of the problem |
63
|
|
|
|
|
|
|
with code and data examples if at all possible. |
64
|
|
|
|
|
|
|
|
65
|
|
|
|
|
|
|
=head2 Reporting Bugs |
66
|
|
|
|
|
|
|
|
67
|
|
|
|
|
|
|
Report bugs to the Bioperl bug tracking system to help us keep track |
68
|
|
|
|
|
|
|
the bugs and their resolution. Bug reports can be submitted via the |
69
|
|
|
|
|
|
|
web: |
70
|
|
|
|
|
|
|
|
71
|
|
|
|
|
|
|
https://github.com/bioperl/bioperl-live/issues |
72
|
|
|
|
|
|
|
|
73
|
|
|
|
|
|
|
=head1 AUTHOR - Chad Matsalla |
74
|
|
|
|
|
|
|
|
75
|
|
|
|
|
|
|
Email bioinformatics-at-dieselwurks.com |
76
|
|
|
|
|
|
|
|
77
|
|
|
|
|
|
|
=head1 APPENDIX |
78
|
|
|
|
|
|
|
|
79
|
|
|
|
|
|
|
The rest of the documentation details each of the object methods. |
80
|
|
|
|
|
|
|
Internal methods are usually preceded with a _ |
81
|
|
|
|
|
|
|
|
82
|
|
|
|
|
|
|
=cut |
83
|
|
|
|
|
|
|
|
84
|
|
|
|
|
|
|
package Bio::Tools::Alignment::Trim; |
85
|
|
|
|
|
|
|
|
86
|
1
|
|
|
1
|
|
3
|
use strict; |
|
1
|
|
|
|
|
1
|
|
|
1
|
|
|
|
|
21
|
|
87
|
1
|
|
|
1
|
|
3
|
use Dumpvalue; |
|
1
|
|
|
|
|
1
|
|
|
1
|
|
|
|
|
15
|
|
88
|
|
|
|
|
|
|
|
89
|
1
|
|
|
1
|
|
2
|
use vars qw(%DEFAULTS); |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
39
|
|
90
|
|
|
|
|
|
|
|
91
|
1
|
|
|
1
|
|
3
|
use base qw(Bio::Root::Root); |
|
1
|
|
|
|
|
1
|
|
|
1
|
|
|
|
|
283
|
|
92
|
|
|
|
|
|
|
|
93
|
|
|
|
|
|
|
BEGIN { |
94
|
1
|
|
|
1
|
|
1199
|
%DEFAULTS = ( 'f_designator' => 'f', |
95
|
|
|
|
|
|
|
'r_designator' => 'r', |
96
|
|
|
|
|
|
|
'windowsize' => '10', |
97
|
|
|
|
|
|
|
'phreds' => '20'); |
98
|
|
|
|
|
|
|
} |
99
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
=head2 new() |
101
|
|
|
|
|
|
|
|
102
|
|
|
|
|
|
|
Title : new() |
103
|
|
|
|
|
|
|
Usage : $o_trim = Bio::Tools::Alignment::Trim->new(); |
104
|
|
|
|
|
|
|
Function: Construct the Bio::Tools::Alignment::Trim object. No parameters |
105
|
|
|
|
|
|
|
are required to create this object. It is strictly a bundle of |
106
|
|
|
|
|
|
|
functions, as far as I am concerned. |
107
|
|
|
|
|
|
|
Returns : A reference to a Bio::Tools::Alignment::Trim object. |
108
|
|
|
|
|
|
|
Args : (optional) |
109
|
|
|
|
|
|
|
-windowsize (default 10) |
110
|
|
|
|
|
|
|
-phreds (default 20) |
111
|
|
|
|
|
|
|
|
112
|
|
|
|
|
|
|
|
113
|
|
|
|
|
|
|
=cut |
114
|
|
|
|
|
|
|
|
115
|
|
|
|
|
|
|
sub new { |
116
|
1
|
|
|
1
|
1
|
2
|
my ($class,@args) = @_; |
117
|
1
|
|
|
|
|
5
|
my $self = $class->SUPER::new(@args); |
118
|
1
|
|
|
|
|
4
|
my($windowsize,$phreds) = |
119
|
|
|
|
|
|
|
$self->_rearrange([qw( |
120
|
|
|
|
|
|
|
WINDOWSIZE |
121
|
|
|
|
|
|
|
PHREDS |
122
|
|
|
|
|
|
|
)], |
123
|
|
|
|
|
|
|
@args); |
124
|
1
|
|
33
|
|
|
5
|
$self->{windowsize} = $windowsize || $DEFAULTS{'windowsize'}; |
125
|
1
|
|
33
|
|
|
5
|
$self->{phreds} = $phreds || $DEFAULTS{'phreds'}; |
126
|
|
|
|
|
|
|
# print("Constructor set phreds to ".$self->{phreds}."\n") if $self->verbose > 0; |
127
|
|
|
|
|
|
|
$self->set_designators($DEFAULTS{'f_designator'}, |
128
|
1
|
|
|
|
|
3
|
$DEFAULTS{'r_designator'}); |
129
|
1
|
|
|
|
|
3
|
return $self; |
130
|
|
|
|
|
|
|
} |
131
|
|
|
|
|
|
|
|
132
|
|
|
|
|
|
|
=head2 set_designators($forward_designator,$reverse_designator) |
133
|
|
|
|
|
|
|
|
134
|
|
|
|
|
|
|
Title : set_designators(,) |
135
|
|
|
|
|
|
|
Usage : $o_trim->set_designators("F","R") |
136
|
|
|
|
|
|
|
Function: Set the string by which the system determines whether a given |
137
|
|
|
|
|
|
|
sequence represents a forward or a reverse read. |
138
|
|
|
|
|
|
|
Returns : Nothing. |
139
|
|
|
|
|
|
|
Args : two scalars: one representing the forward designator and one |
140
|
|
|
|
|
|
|
representing the reverse designator |
141
|
|
|
|
|
|
|
|
142
|
|
|
|
|
|
|
=cut |
143
|
|
|
|
|
|
|
|
144
|
|
|
|
|
|
|
sub set_designators { |
145
|
2
|
|
|
2
|
1
|
2
|
my $self = shift; |
146
|
2
|
|
|
|
|
7
|
($self->{'f_designator'},$self->{'r_designator'}) = @_; |
147
|
|
|
|
|
|
|
} |
148
|
|
|
|
|
|
|
|
149
|
|
|
|
|
|
|
=head2 set_forward_designator($designator) |
150
|
|
|
|
|
|
|
|
151
|
|
|
|
|
|
|
Title : set_forward_designator($designator) |
152
|
|
|
|
|
|
|
Usage : $o_trim->set_forward_designator("F") |
153
|
|
|
|
|
|
|
Function: Set the string by which the system determines if a given |
154
|
|
|
|
|
|
|
sequence is a forward read. |
155
|
|
|
|
|
|
|
Returns : Nothing. |
156
|
|
|
|
|
|
|
Args : A string representing the forward designator of this project. |
157
|
|
|
|
|
|
|
|
158
|
|
|
|
|
|
|
=cut |
159
|
|
|
|
|
|
|
|
160
|
|
|
|
|
|
|
sub set_forward_designator { |
161
|
1
|
|
|
1
|
1
|
1
|
my ($self,$desig) = @_; |
162
|
1
|
|
|
|
|
1
|
$self->{'f_designator'} = $desig; |
163
|
|
|
|
|
|
|
} |
164
|
|
|
|
|
|
|
|
165
|
|
|
|
|
|
|
=head2 set_reverse_designator($reverse_designator) |
166
|
|
|
|
|
|
|
|
167
|
|
|
|
|
|
|
Title : set_reverse_designator($reverse_designator) |
168
|
|
|
|
|
|
|
Function: Set the string by which the system determines if a given |
169
|
|
|
|
|
|
|
sequence is a reverse read. |
170
|
|
|
|
|
|
|
Usage : $o_trim->set_reverse_designator("R") |
171
|
|
|
|
|
|
|
Returns : Nothing. |
172
|
|
|
|
|
|
|
Args : A string representing the forward designator of this project. |
173
|
|
|
|
|
|
|
|
174
|
|
|
|
|
|
|
=cut |
175
|
|
|
|
|
|
|
|
176
|
|
|
|
|
|
|
sub set_reverse_designator { |
177
|
1
|
|
|
1
|
1
|
1
|
my ($self,$desig) = @_; |
178
|
1
|
|
|
|
|
1
|
$self->{'r_designator'} = $desig; |
179
|
|
|
|
|
|
|
} |
180
|
|
|
|
|
|
|
|
181
|
|
|
|
|
|
|
=head2 get_designators() |
182
|
|
|
|
|
|
|
|
183
|
|
|
|
|
|
|
Title : get_designators() |
184
|
|
|
|
|
|
|
Usage : $o_trim->get_designators() |
185
|
|
|
|
|
|
|
Returns : A string describing the current designators. |
186
|
|
|
|
|
|
|
Args : None |
187
|
|
|
|
|
|
|
Notes : Really for informational purposes only. Duh. |
188
|
|
|
|
|
|
|
|
189
|
|
|
|
|
|
|
=cut |
190
|
|
|
|
|
|
|
|
191
|
|
|
|
|
|
|
sub get_designators { |
192
|
0
|
|
|
0
|
1
|
|
my $self = shift; |
193
|
0
|
|
|
|
|
|
return("forward: ".$self->{'f_designator'}." reverse: ".$self->{'r_designator'}); |
194
|
|
|
|
|
|
|
} |
195
|
|
|
|
|
|
|
|
196
|
|
|
|
|
|
|
=head2 trim_leading_polys() |
197
|
|
|
|
|
|
|
|
198
|
|
|
|
|
|
|
Title : trim_leading_polys() |
199
|
|
|
|
|
|
|
Usage : $o_trim->trim_leading_polys() |
200
|
|
|
|
|
|
|
Function: Not implemented. Does nothing. |
201
|
|
|
|
|
|
|
Returns : Nothing. |
202
|
|
|
|
|
|
|
Args : None. |
203
|
|
|
|
|
|
|
Notes : This function is not implemented. Part of something I wanted to |
204
|
|
|
|
|
|
|
do but never got around to doing. |
205
|
|
|
|
|
|
|
|
206
|
|
|
|
|
|
|
=cut |
207
|
|
|
|
|
|
|
|
208
|
|
|
|
|
|
|
sub trim_leading_polys { |
209
|
0
|
|
|
0
|
1
|
|
my ($self, $sequence) = @_; |
210
|
|
|
|
|
|
|
} |
211
|
|
|
|
|
|
|
|
212
|
|
|
|
|
|
|
=head2 dump_hash() |
213
|
|
|
|
|
|
|
|
214
|
|
|
|
|
|
|
Title : dump_hash() |
215
|
|
|
|
|
|
|
Usage : $o_trim->dump_hash() |
216
|
|
|
|
|
|
|
Function: Unimplemented. |
217
|
|
|
|
|
|
|
Returns : Nothing. |
218
|
|
|
|
|
|
|
Args : None. |
219
|
|
|
|
|
|
|
Notes : Does nothing. |
220
|
|
|
|
|
|
|
|
221
|
|
|
|
|
|
|
=cut |
222
|
|
|
|
|
|
|
|
223
|
|
|
|
|
|
|
sub dump_hash { |
224
|
0
|
|
|
0
|
1
|
|
my $self = shift; |
225
|
0
|
|
|
|
|
|
my %hash = %{$self->{'qualities'}}; |
|
0
|
|
|
|
|
|
|
226
|
|
|
|
|
|
|
} # end dump_hash |
227
|
|
|
|
|
|
|
|
228
|
|
|
|
|
|
|
=head2 trim_singlet($sequence,$quality,$name,$class) |
229
|
|
|
|
|
|
|
|
230
|
|
|
|
|
|
|
Title : trim_singlet($sequence,$quality,$name,$class) |
231
|
|
|
|
|
|
|
Usage : ($r_trim_points,$trimmed_sequence) = |
232
|
|
|
|
|
|
|
@{$o_trim->trim_singlet($sequence,$quality,$name,$class)}; |
233
|
|
|
|
|
|
|
Function: Trim a singlet based on its quality. |
234
|
|
|
|
|
|
|
Returns : a reference to an array containing the forward and reverse |
235
|
|
|
|
|
|
|
trim points and the trimmed sequence. |
236
|
|
|
|
|
|
|
Args : $sequence : A sequence (SCALAR, please) |
237
|
|
|
|
|
|
|
$quality : A _scalar_ of space-delimited quality values. |
238
|
|
|
|
|
|
|
$name : the name of the sequence |
239
|
|
|
|
|
|
|
$class : The class of the sequence. One of qw(singlet |
240
|
|
|
|
|
|
|
singleton doublet pair multiplet) |
241
|
|
|
|
|
|
|
Notes : At the time this was written the bioperl objects SeqWithQuality |
242
|
|
|
|
|
|
|
and PrimaryQual did not exist. This is what is with the clumsy |
243
|
|
|
|
|
|
|
passing of references and so on. I will rewrite this next time I |
244
|
|
|
|
|
|
|
have to work with it. I also wasn't sure whether this function |
245
|
|
|
|
|
|
|
should return just the trim points or the points and the sequence. |
246
|
|
|
|
|
|
|
I decided that I always wanted both so that's how I implemented |
247
|
|
|
|
|
|
|
it. |
248
|
|
|
|
|
|
|
- Note that the size of the sliding windows is set during construction of |
249
|
|
|
|
|
|
|
the Bio::Tools::Alignment::Trim object. |
250
|
|
|
|
|
|
|
|
251
|
|
|
|
|
|
|
=cut |
252
|
|
|
|
|
|
|
|
253
|
|
|
|
|
|
|
sub trim_singlet { |
254
|
0
|
|
|
0
|
1
|
|
my ($self,$sequence,$quality,$name,$class) = @_; |
255
|
|
|
|
|
|
|
# this split is done because I normally store quality values in a |
256
|
|
|
|
|
|
|
# space-delimited scalar rather then in an array. |
257
|
|
|
|
|
|
|
# I do this because serialization of the arrays is tough. |
258
|
0
|
|
|
|
|
|
my @qual = split(' ',$quality); |
259
|
0
|
|
|
|
|
|
my @points; |
260
|
0
|
|
|
|
|
|
my $sequence_length = length($sequence); |
261
|
0
|
|
|
|
|
|
my ($returnstring,$processed_sequence); |
262
|
|
|
|
|
|
|
# smooth out the qualities |
263
|
0
|
|
|
|
|
|
my $r_windows = &_sliding_window(\@qual,$self->{windowsize}); |
264
|
|
|
|
|
|
|
# find out the leading and trailing trimpoints |
265
|
0
|
|
|
|
|
|
my $start_base = $self->_get_start($r_windows,$self->{windowsize},$self->{phreds}); |
266
|
0
|
|
|
|
|
|
my (@new_points,$trimmed_sequence); |
267
|
|
|
|
|
|
|
# do you think that any sequence shorter then 100 should be |
268
|
|
|
|
|
|
|
# discarded? I don't think that this should be the decision of this |
269
|
|
|
|
|
|
|
# module. |
270
|
|
|
|
|
|
|
# removed, 020926 |
271
|
0
|
|
|
|
|
|
$points[0] = $start_base; |
272
|
|
|
|
|
|
|
# whew! now for the end base |
273
|
|
|
|
|
|
|
# required parameters: reference_to_windows,windowsize,$phredvalue,start_base |
274
|
|
|
|
|
|
|
my $end_base = &_get_end($r_windows,$self->{windowsize}, |
275
|
0
|
|
|
|
|
|
$self->{phreds},$start_base); |
276
|
0
|
|
|
|
|
|
$points[1] = $end_base; |
277
|
|
|
|
|
|
|
# now do the actual trimming |
278
|
|
|
|
|
|
|
# CHAD : I don't think that it is a good idea to call chop_sequence here |
279
|
|
|
|
|
|
|
# because chop_sequence also removes X's and N's and things |
280
|
|
|
|
|
|
|
# and that is not always what is wanted |
281
|
0
|
|
|
|
|
|
return \@points; |
282
|
|
|
|
|
|
|
} |
283
|
|
|
|
|
|
|
|
284
|
|
|
|
|
|
|
=head2 trim_doublet($sequence,$quality,$name,$class) |
285
|
|
|
|
|
|
|
|
286
|
|
|
|
|
|
|
Title : trim_doublet($sequence,$quality,$name,$class) |
287
|
|
|
|
|
|
|
Usage : ($r_trim_points,$trimmed_sequence) = |
288
|
|
|
|
|
|
|
@{$o_trim->trim_singlet($sequence,$quality,$name,$class)}; |
289
|
|
|
|
|
|
|
Function: Trim a singlet based on its quality. |
290
|
|
|
|
|
|
|
Returns : a reference to an array containing the forward and reverse |
291
|
|
|
|
|
|
|
Args : $sequence : A sequence |
292
|
|
|
|
|
|
|
$quality : A _scalar_ of space-delimited quality values. |
293
|
|
|
|
|
|
|
$name : the name of the sequence |
294
|
|
|
|
|
|
|
$class : The class of the sequence. One of qw(singlet |
295
|
|
|
|
|
|
|
singleton doublet pair multiplet) |
296
|
|
|
|
|
|
|
Notes : At the time this was written the bioperl objects SeqWithQuality |
297
|
|
|
|
|
|
|
and PrimaryQual did not exist. This is what is with the clumsy |
298
|
|
|
|
|
|
|
passing of references and so on. I will rewrite this next time I |
299
|
|
|
|
|
|
|
have to work with it. I also wasn't sure whether this function |
300
|
|
|
|
|
|
|
should return just the trim points or the points and the sequence. |
301
|
|
|
|
|
|
|
I decided that I always wanted both so that's how I implemented |
302
|
|
|
|
|
|
|
it. |
303
|
|
|
|
|
|
|
|
304
|
|
|
|
|
|
|
=cut |
305
|
|
|
|
|
|
|
|
306
|
|
|
|
|
|
|
#' |
307
|
|
|
|
|
|
|
sub trim_doublet { |
308
|
0
|
|
|
0
|
1
|
|
my ($self,$sequence,$quality,$name,$class) = @_; |
309
|
0
|
|
|
|
|
|
my @qual = split(' ',$quality); |
310
|
0
|
|
|
|
|
|
my @points; |
311
|
0
|
|
|
|
|
|
my $sequence_length = length($sequence); |
312
|
0
|
|
|
|
|
|
my ($returnstring,$processed_sequence); |
313
|
|
|
|
|
|
|
# smooth out the qualities |
314
|
0
|
|
|
|
|
|
my $r_windows = &_sliding_window(\@qual,$self->{windowsize}); |
315
|
|
|
|
|
|
|
# determine where the consensus sequence starts |
316
|
0
|
|
|
|
|
|
my $offset = 0; |
317
|
0
|
|
|
|
|
|
for (my $current = 0; $current<$sequence_length;$current++) { |
318
|
0
|
0
|
|
|
|
|
if ($qual[$current] != 0) { |
319
|
0
|
|
|
|
|
|
$offset = $current; |
320
|
0
|
|
|
|
|
|
last; |
321
|
|
|
|
|
|
|
} |
322
|
|
|
|
|
|
|
} |
323
|
|
|
|
|
|
|
# start_base required: r_quality,$windowsize,$phredvalue |
324
|
0
|
|
|
|
|
|
my $start_base = $self->_get_start($r_windows,$self->{windowsize},$self->{phreds},$offset); |
325
|
0
|
0
|
|
|
|
|
if ($start_base > ($sequence_length - 100)) { |
326
|
0
|
|
|
|
|
|
$points[0] = ("FAILED"); |
327
|
0
|
|
|
|
|
|
$points[1] = ("FAILED"); |
328
|
0
|
|
|
|
|
|
return @points; |
329
|
|
|
|
|
|
|
} |
330
|
0
|
|
|
|
|
|
$points[0] = $start_base; |
331
|
|
|
|
|
|
|
# |
332
|
|
|
|
|
|
|
# whew! now for the end base |
333
|
|
|
|
|
|
|
# |
334
|
|
|
|
|
|
|
# required parameters: reference_to_windows,windowsize,$phredvalue,start_base |
335
|
|
|
|
|
|
|
# | |
336
|
|
|
|
|
|
|
# 010420 NOTE: We will no longer get the end base to avoid the Q/--\___/-- syndrome |
337
|
0
|
|
|
|
|
|
my $end_base = $sequence_length; |
338
|
0
|
|
|
|
|
|
my $start_of_trailing_zeros = &count_doublet_trailing_zeros(\@qual); |
339
|
0
|
|
|
|
|
|
$points[1] = $end_base; |
340
|
|
|
|
|
|
|
# CHAD : I don't think that it is a good idea to call chop_sequence here |
341
|
|
|
|
|
|
|
# because chop_sequence also removes X's and N's and things |
342
|
|
|
|
|
|
|
# and that is not always what is wanted |
343
|
0
|
|
|
|
|
|
return @points; |
344
|
|
|
|
|
|
|
} # end trim_doublet |
345
|
|
|
|
|
|
|
|
346
|
|
|
|
|
|
|
=head2 chop_sequence($name,$class,$sequence,@points) |
347
|
|
|
|
|
|
|
|
348
|
|
|
|
|
|
|
Title : chop_sequence($name,$class,$sequence,@points) |
349
|
|
|
|
|
|
|
Usage : ($start_point,$end_point,$chopped_sequence) = |
350
|
|
|
|
|
|
|
$o_trim->chop_sequence($name,$class,$sequence,@points); |
351
|
|
|
|
|
|
|
Function: Chop a sequence based on its name, class, and sequence. |
352
|
|
|
|
|
|
|
Returns : an array containing three scalars: |
353
|
|
|
|
|
|
|
1- the start trim point |
354
|
|
|
|
|
|
|
2- the end trim point |
355
|
|
|
|
|
|
|
3- the chopped sequence |
356
|
|
|
|
|
|
|
Args : |
357
|
|
|
|
|
|
|
$name : the name of the sequence |
358
|
|
|
|
|
|
|
$class : The class of the sequence. One of qw(singlet |
359
|
|
|
|
|
|
|
singleton doublet pair multiplet) |
360
|
|
|
|
|
|
|
$sequence : A sequence |
361
|
|
|
|
|
|
|
@points : An array containing two elements- the first contains |
362
|
|
|
|
|
|
|
the start trim point and the second conatines the end trim |
363
|
|
|
|
|
|
|
point. |
364
|
|
|
|
|
|
|
|
365
|
|
|
|
|
|
|
=cut |
366
|
|
|
|
|
|
|
|
367
|
|
|
|
|
|
|
sub chop_sequence { |
368
|
0
|
|
|
0
|
1
|
|
my ($self,$name,$class,$sequence,@points) = @_; |
369
|
0
|
|
|
|
|
|
print("Coming into chop_sequence, \@points are @points\n"); |
370
|
0
|
|
|
|
|
|
my $fdesig = $self->{'f_designator'}; |
371
|
0
|
|
|
|
|
|
my $rdesig = $self->{'r_designator'}; |
372
|
0
|
0
|
0
|
|
|
|
if (!$points[0] && !$points[1]) { |
373
|
0
|
|
|
|
|
|
$sequence = "junk"; |
374
|
0
|
|
|
|
|
|
return $sequence; |
375
|
|
|
|
|
|
|
} |
376
|
0
|
0
|
0
|
|
|
|
if ($class eq "singlet" && $name =~ /$fdesig$/) { |
|
|
0
|
0
|
|
|
|
|
|
|
0
|
0
|
|
|
|
|
|
|
0
|
0
|
|
|
|
|
|
|
0
|
|
|
|
|
|
377
|
0
|
|
|
|
|
|
$sequence = substr($sequence,$points[0],$points[1]-$points[0]); |
378
|
|
|
|
|
|
|
} |
379
|
|
|
|
|
|
|
elsif ($class eq "singlet" && $name =~ /$rdesig$/) { |
380
|
0
|
|
|
|
|
|
$sequence = substr($sequence,$points[0],$points[1]-$points[0]); |
381
|
|
|
|
|
|
|
} |
382
|
|
|
|
|
|
|
elsif ($class eq "singleton" && $name =~ /$fdesig$/) { |
383
|
0
|
|
|
|
|
|
$sequence = substr($sequence,$points[0],$points[1]-$points[0]); |
384
|
|
|
|
|
|
|
} |
385
|
|
|
|
|
|
|
elsif ($class eq "singleton" && $name =~ /$rdesig$/) { |
386
|
0
|
|
|
|
|
|
$sequence = substr($sequence,$points[0],$points[1]-$points[0]); |
387
|
|
|
|
|
|
|
} |
388
|
|
|
|
|
|
|
elsif ($class eq "doublet") { |
389
|
0
|
|
|
|
|
|
$sequence = substr($sequence,$points[0],$points[1]-$points[0]); |
390
|
|
|
|
|
|
|
} |
391
|
|
|
|
|
|
|
# this is a _terrible_ to do this! i couldn't seem to find a better way |
392
|
|
|
|
|
|
|
# i thought something like s/(^.*[Xx]{5,})//g; might work, but no go |
393
|
|
|
|
|
|
|
# no time to find a fix! |
394
|
0
|
|
|
|
|
|
my $length_before_trimming = length($sequence); |
395
|
0
|
|
|
|
|
|
my $subs_Xs = $sequence =~ s/^.*[Xx]{5,}//g; |
396
|
0
|
0
|
|
|
|
|
if ($subs_Xs) { |
397
|
0
|
|
|
|
|
|
my $length_after_trimming = length($sequence); |
398
|
0
|
|
|
|
|
|
my $number_Xs_trimmed = $length_before_trimming - $length_after_trimming; |
399
|
0
|
|
|
|
|
|
$points[0] += $number_Xs_trimmed; |
400
|
|
|
|
|
|
|
} |
401
|
0
|
|
|
|
|
|
$length_before_trimming = length($sequence); |
402
|
0
|
|
|
|
|
|
my $subs_Ns = $sequence =~ s/[Nn]{1,}$//g; |
403
|
0
|
0
|
|
|
|
|
if ($subs_Ns) { |
404
|
0
|
|
|
|
|
|
my $length_after_trimming = length($sequence); |
405
|
0
|
|
|
|
|
|
my $number_Ns_trimmed = $length_before_trimming - $length_after_trimming; |
406
|
0
|
|
|
|
|
|
$points[1] -= $number_Ns_trimmed; |
407
|
0
|
|
|
|
|
|
$points[1] -= 1; |
408
|
|
|
|
|
|
|
} |
409
|
0
|
|
|
|
|
|
push @points,$sequence; |
410
|
0
|
|
|
|
|
|
print("chop_sequence \@points are @points\n"); |
411
|
0
|
|
|
|
|
|
return @points; |
412
|
|
|
|
|
|
|
} |
413
|
|
|
|
|
|
|
|
414
|
|
|
|
|
|
|
=head2 _get_start($r_quals,$windowsize,$phreds,$offset) |
415
|
|
|
|
|
|
|
|
416
|
|
|
|
|
|
|
Title : _get_start($r_quals,$windowsize,$phreds,$offset) |
417
|
|
|
|
|
|
|
Usage : $start_base = $self->_get_start($r_windows,5,20); |
418
|
|
|
|
|
|
|
Function: Provide the start trim point for this sequence. |
419
|
|
|
|
|
|
|
Returns : a scalar representing the start of the sequence |
420
|
|
|
|
|
|
|
Args : |
421
|
|
|
|
|
|
|
$r_quals : A reference to an array containing quality values. In |
422
|
|
|
|
|
|
|
context, this array of values has been smoothed by then |
423
|
|
|
|
|
|
|
sliding window-look ahead algorithm. |
424
|
|
|
|
|
|
|
$windowsize : The size of the window used when the sliding window |
425
|
|
|
|
|
|
|
look-ahead average was calculated. |
426
|
|
|
|
|
|
|
$phreds : |
427
|
|
|
|
|
|
|
$offset : |
428
|
|
|
|
|
|
|
|
429
|
|
|
|
|
|
|
=cut |
430
|
|
|
|
|
|
|
|
431
|
|
|
|
|
|
|
sub _get_start { |
432
|
0
|
|
|
0
|
|
|
my ($self,$r_quals,$windowsize,$phreds,$offset) = @_; |
433
|
0
|
0
|
|
|
|
|
print("Using $phreds phreds\n") if $self->verbose > 0; |
434
|
|
|
|
|
|
|
# this is to help determine whether the sequence is good at all |
435
|
0
|
|
|
|
|
|
my @quals = @$r_quals; |
436
|
0
|
|
|
|
|
|
my ($count,$count2,$qualsum); |
437
|
0
|
0
|
|
|
|
|
if ($offset) { $count = $offset; } else { $count = 0; } |
|
0
|
|
|
|
|
|
|
|
0
|
|
|
|
|
|
|
438
|
|
|
|
|
|
|
# search along the length of the sequence |
439
|
0
|
|
|
|
|
|
for (; ($count+$windowsize) <= scalar(@quals); $count++) { |
440
|
|
|
|
|
|
|
# sum all of the quality values in this window. |
441
|
0
|
|
|
|
|
|
my $cumulative=0; |
442
|
0
|
|
|
|
|
|
for($count2 = $count; $count2 < $count+$windowsize; $count2++) { |
443
|
0
|
0
|
|
|
|
|
if (!$quals[$count2]) { |
444
|
|
|
|
|
|
|
# print("Quals don't exist here!\n"); |
445
|
|
|
|
|
|
|
} |
446
|
|
|
|
|
|
|
else { |
447
|
0
|
|
|
|
|
|
$qualsum += $quals[$count2]; |
448
|
|
|
|
|
|
|
# print("Incremented qualsum to ($qualsum)\n"); |
449
|
|
|
|
|
|
|
} |
450
|
0
|
|
|
|
|
|
$cumulative++; |
451
|
|
|
|
|
|
|
} |
452
|
|
|
|
|
|
|
# print("The sum of this window (starting at $count) is $qualsum. I counted $cumulative bases.\n"); |
453
|
|
|
|
|
|
|
# if the total of windowsize * phreds is |
454
|
0
|
0
|
0
|
|
|
|
if ($qualsum && $qualsum >= $windowsize*$phreds) { return $count; } |
|
0
|
|
|
|
|
|
|
455
|
0
|
|
|
|
|
|
$qualsum = 0; |
456
|
|
|
|
|
|
|
} |
457
|
|
|
|
|
|
|
# if ($count > scalar(@quals)-$windowsize) { return; } |
458
|
0
|
|
|
|
|
|
return $count; |
459
|
|
|
|
|
|
|
} |
460
|
|
|
|
|
|
|
|
461
|
|
|
|
|
|
|
=head2 _get_end($r_qual,$windowsize,$phreds,$count) |
462
|
|
|
|
|
|
|
|
463
|
|
|
|
|
|
|
Title : _get_end($r_qual,$windowsize,$phreds,$count) |
464
|
|
|
|
|
|
|
Usage : my $end_base = &_get_end($r_windows,20,20,$start_base); |
465
|
|
|
|
|
|
|
Function: Get the end trim point for this sequence. |
466
|
|
|
|
|
|
|
Returns : A scalar representing the end trim point for this sequence. |
467
|
|
|
|
|
|
|
Args : |
468
|
|
|
|
|
|
|
$r_qual : A reference to an array containing quality values. In |
469
|
|
|
|
|
|
|
context, this array of values has been smoothed by then |
470
|
|
|
|
|
|
|
sliding window-look ahead algorithm. |
471
|
|
|
|
|
|
|
$windowsize : The size of the window used when the sliding window |
472
|
|
|
|
|
|
|
look-ahead average was calculated. |
473
|
|
|
|
|
|
|
$phreds : |
474
|
|
|
|
|
|
|
$count : Start looking for the end of the sequence here. |
475
|
|
|
|
|
|
|
|
476
|
|
|
|
|
|
|
=cut |
477
|
|
|
|
|
|
|
|
478
|
|
|
|
|
|
|
sub _get_end { |
479
|
0
|
|
|
0
|
|
|
my ($r_qual,$windowsize,$phreds,$count) = @_; |
480
|
0
|
|
|
|
|
|
my @quals = @$r_qual; |
481
|
0
|
|
|
|
|
|
my $total_bases = scalar(@quals); |
482
|
0
|
|
|
|
|
|
my ($count2,$qualsum,$end_of_quals,$bases_counted); |
483
|
0
|
0
|
|
|
|
|
if (!$count) { $count=0; } |
|
0
|
|
|
|
|
|
|
484
|
0
|
|
|
|
|
|
BASE: for (; $count < $total_bases; $count++) { |
485
|
0
|
|
|
|
|
|
$bases_counted = 0; |
486
|
0
|
|
|
|
|
|
$qualsum = 0; |
487
|
0
|
|
|
|
|
|
POSITION: for($count2 = $count; $count2 < $total_bases; $count2++) { |
488
|
0
|
|
|
|
|
|
$bases_counted++; |
489
|
|
|
|
|
|
|
|
490
|
0
|
0
|
|
|
|
|
if ($count2 == $total_bases-1) { |
|
|
0
|
|
|
|
|
|
491
|
0
|
|
|
|
|
|
$qualsum += $quals[$count2]; |
492
|
0
|
|
|
|
|
|
$bases_counted++; |
493
|
0
|
|
|
|
|
|
last BASE; |
494
|
|
|
|
|
|
|
} |
495
|
|
|
|
|
|
|
elsif ($bases_counted == $windowsize) { |
496
|
0
|
|
|
|
|
|
$qualsum += $quals[$count2]; |
497
|
0
|
0
|
|
|
|
|
if ($qualsum < $bases_counted*$phreds) { |
498
|
0
|
|
|
|
|
|
return $count+$bases_counted+$windowsize; |
499
|
|
|
|
|
|
|
} |
500
|
0
|
|
|
|
|
|
next BASE; |
501
|
|
|
|
|
|
|
} |
502
|
|
|
|
|
|
|
else { |
503
|
0
|
|
|
|
|
|
$qualsum += $quals[$count2]; |
504
|
|
|
|
|
|
|
} |
505
|
|
|
|
|
|
|
} |
506
|
0
|
0
|
|
|
|
|
if ($qualsum < $bases_counted*$phreds) { |
507
|
0
|
|
|
|
|
|
return $count+$bases_counted+$windowsize; |
508
|
|
|
|
|
|
|
} |
509
|
|
|
|
|
|
|
else { } |
510
|
0
|
|
|
|
|
|
$qualsum = 0; |
511
|
|
|
|
|
|
|
} # end for |
512
|
0
|
0
|
|
|
|
|
if ($end_of_quals) { |
513
|
0
|
|
|
|
|
|
my $bases_for_average = $total_bases-$count2; |
514
|
0
|
|
|
|
|
|
return $count2; |
515
|
|
|
|
|
|
|
} |
516
|
|
|
|
|
|
|
else { } |
517
|
0
|
0
|
|
|
|
|
if ($qualsum) { } # print ("$qualsum\n"); |
518
|
0
|
|
|
|
|
|
return $total_bases; |
519
|
|
|
|
|
|
|
} # end get_end |
520
|
|
|
|
|
|
|
|
521
|
|
|
|
|
|
|
=head2 count_doublet_trailing_zeros($r_qual) |
522
|
|
|
|
|
|
|
|
523
|
|
|
|
|
|
|
Title : count_doublet_trailing_zeros($r_qual) |
524
|
|
|
|
|
|
|
Usage : my $start_of_trailing_zeros = &count_doublet_trailing_zeros(\@qual); |
525
|
|
|
|
|
|
|
Function: Find out when the trailing zero qualities start. |
526
|
|
|
|
|
|
|
Returns : A scalar representing where the zeros start. |
527
|
|
|
|
|
|
|
Args : A reference to an array of quality values. |
528
|
|
|
|
|
|
|
Notes : Again, this should be rewritten to use PrimaryQual objects. |
529
|
|
|
|
|
|
|
A more detailed explanation of why phrap puts these zeros here should |
530
|
|
|
|
|
|
|
be written and placed here. Please email and hassle the author. |
531
|
|
|
|
|
|
|
|
532
|
|
|
|
|
|
|
|
533
|
|
|
|
|
|
|
=cut |
534
|
|
|
|
|
|
|
|
535
|
|
|
|
|
|
|
sub count_doublet_trailing_zeros { |
536
|
0
|
|
|
0
|
1
|
|
my ($r_qual) = shift; |
537
|
0
|
|
|
|
|
|
my $number_of_trailing_zeros = 0; |
538
|
0
|
|
|
|
|
|
my @qualities = @$r_qual; |
539
|
0
|
|
|
|
|
|
for (my $current=scalar(@qualities);$current>0;$current--) { |
540
|
0
|
0
|
0
|
|
|
|
if ($qualities[$current] && $qualities[$current] != 0) { |
541
|
0
|
|
|
|
|
|
$number_of_trailing_zeros = scalar(@qualities)-$current; |
542
|
0
|
|
|
|
|
|
return $current+1; |
543
|
|
|
|
|
|
|
} |
544
|
|
|
|
|
|
|
} |
545
|
0
|
|
|
|
|
|
return scalar(@qualities); |
546
|
|
|
|
|
|
|
} # end count_doublet_trailing_zeros |
547
|
|
|
|
|
|
|
|
548
|
|
|
|
|
|
|
=head2 _sliding_window($r_quals,$windowsize) |
549
|
|
|
|
|
|
|
|
550
|
|
|
|
|
|
|
Title : _sliding_window($r_quals,$windowsize) |
551
|
|
|
|
|
|
|
Usage : my $r_windows = &_sliding_window(\@qual,$windowsize); |
552
|
|
|
|
|
|
|
Function: Create a sliding window, look-forward-average on an array |
553
|
|
|
|
|
|
|
of quality values. Used to smooth out differences in qualities. |
554
|
|
|
|
|
|
|
Returns : A reference to an array containing the smoothed values. |
555
|
|
|
|
|
|
|
Args : $r_quals: A reference to an array containing quality values. |
556
|
|
|
|
|
|
|
$windowsize : The size of the sliding window. |
557
|
|
|
|
|
|
|
Notes : This was written before PrimaryQual objects existed. They |
558
|
|
|
|
|
|
|
should use that object but I haven't rewritten this yet. |
559
|
|
|
|
|
|
|
|
560
|
|
|
|
|
|
|
=cut |
561
|
|
|
|
|
|
|
|
562
|
|
|
|
|
|
|
#' |
563
|
|
|
|
|
|
|
sub _sliding_window { |
564
|
0
|
|
|
0
|
|
|
my ($r_quals,$windowsize) = @_; |
565
|
0
|
|
|
|
|
|
my (@window,@quals,$qualsum,$count,$count2,$average,@averages,$bases_counted); |
566
|
0
|
|
|
|
|
|
@quals = @$r_quals; |
567
|
0
|
|
|
|
|
|
my $size_of_quality = scalar(@quals); |
568
|
|
|
|
|
|
|
# do this loop for all of the qualities |
569
|
0
|
|
|
|
|
|
for ($count=0; $count <= $size_of_quality; $count++) { |
570
|
0
|
|
|
|
|
|
$bases_counted = 0; |
571
|
0
|
|
|
|
|
|
BASE: for($count2 = $count; $count2 < $size_of_quality; $count2++) { |
572
|
0
|
|
|
|
|
|
$bases_counted++; |
573
|
|
|
|
|
|
|
# if the search hits the end of the averages, stop |
574
|
|
|
|
|
|
|
# this is for the case near the end where bases remaining < windowsize |
575
|
0
|
0
|
|
|
|
|
if ($count2 == $size_of_quality) { |
|
|
0
|
|
|
|
|
|
576
|
0
|
|
|
|
|
|
$qualsum += $quals[$count2]; |
577
|
0
|
|
|
|
|
|
last BASE; |
578
|
|
|
|
|
|
|
} |
579
|
|
|
|
|
|
|
# if the search hits the size of the window |
580
|
|
|
|
|
|
|
elsif ($bases_counted == $windowsize) { |
581
|
0
|
|
|
|
|
|
$qualsum += $quals[$count2]; |
582
|
0
|
|
|
|
|
|
last BASE; |
583
|
|
|
|
|
|
|
} |
584
|
|
|
|
|
|
|
# otherwise add the quality value |
585
|
0
|
0
|
|
|
|
|
unless (!$quals[$count2]) { |
586
|
0
|
|
|
|
|
|
$qualsum += $quals[$count2]; |
587
|
|
|
|
|
|
|
} |
588
|
|
|
|
|
|
|
} |
589
|
0
|
0
|
0
|
|
|
|
unless (!$qualsum || !$windowsize) { |
590
|
0
|
|
|
|
|
|
$average = $qualsum / $bases_counted; |
591
|
0
|
0
|
|
|
|
|
if (!$average) { $average = "0"; } |
|
0
|
|
|
|
|
|
|
592
|
0
|
|
|
|
|
|
push @averages,$average; |
593
|
|
|
|
|
|
|
} |
594
|
0
|
|
|
|
|
|
$qualsum = 0; |
595
|
|
|
|
|
|
|
} |
596
|
|
|
|
|
|
|
# 02101 Yes, I repaired the mismatching numbers between averages and windows. |
597
|
|
|
|
|
|
|
# print("There are ".scalar(@$r_quals)." quality values. They are @$r_quals\n"); |
598
|
|
|
|
|
|
|
# print("There are ".scalar(@averages)." average values. They are @averages\n"); |
599
|
0
|
|
|
|
|
|
return \@averages; |
600
|
|
|
|
|
|
|
|
601
|
|
|
|
|
|
|
} |
602
|
|
|
|
|
|
|
|
603
|
|
|
|
|
|
|
=head2 _print_formatted_qualities |
604
|
|
|
|
|
|
|
|
605
|
|
|
|
|
|
|
Title : _print_formatted_qualities(\@quals) |
606
|
|
|
|
|
|
|
Usage : &_print_formatted_qualities(\@quals); |
607
|
|
|
|
|
|
|
Returns : Nothing. Prints. |
608
|
|
|
|
|
|
|
Args : A reference to an array containing quality values. |
609
|
|
|
|
|
|
|
Notes : An internal procedure used in debugging. Prints out an array nicely. |
610
|
|
|
|
|
|
|
|
611
|
|
|
|
|
|
|
=cut |
612
|
|
|
|
|
|
|
|
613
|
|
|
|
|
|
|
sub _print_formatted_qualities { |
614
|
0
|
|
|
0
|
|
|
my $rquals = shift; |
615
|
0
|
|
|
|
|
|
my @qual = @$rquals; |
616
|
0
|
|
|
|
|
|
for (my $count=0; $count
|
617
|
0
|
0
|
|
|
|
|
if (($count%10)==0) { print("\n$count\t"); } |
|
0
|
|
|
|
|
|
|
618
|
0
|
0
|
|
|
|
|
if ($qual[$count]) { print ("$qual[$count]\t");} |
|
0
|
|
|
|
|
|
|
619
|
0
|
|
|
|
|
|
else { print("0\t"); } |
620
|
|
|
|
|
|
|
} |
621
|
0
|
|
|
|
|
|
print("\n"); |
622
|
|
|
|
|
|
|
} |
623
|
|
|
|
|
|
|
|
624
|
|
|
|
|
|
|
=head2 _get_end_old($r_qual,$windowsize,$phreds,$count) |
625
|
|
|
|
|
|
|
|
626
|
|
|
|
|
|
|
Title : _get_end_old($r_qual,$windowsize,$phreds,$count) |
627
|
|
|
|
|
|
|
Usage : Deprecated. Don't use this! |
628
|
|
|
|
|
|
|
Returns : Deprecated. Don't use this! |
629
|
|
|
|
|
|
|
Args : Deprecated. Don't use this! |
630
|
|
|
|
|
|
|
|
631
|
|
|
|
|
|
|
=cut |
632
|
|
|
|
|
|
|
|
633
|
|
|
|
|
|
|
#' |
634
|
|
|
|
|
|
|
sub _get_end_old { |
635
|
0
|
|
|
0
|
|
|
my ($r_qual,$windowsize,$phreds,$count) = @_; |
636
|
0
|
|
|
|
|
|
warn("Do Not Use this function (_get_end_old)"); |
637
|
0
|
|
|
|
|
|
my $target = $windowsize*$phreds; |
638
|
0
|
|
|
|
|
|
my @quals = @$r_qual; |
639
|
0
|
|
|
|
|
|
my $total_bases = scalar(@quals); |
640
|
0
|
|
|
|
|
|
my ($count2,$qualsum,$end_of_quals); |
641
|
0
|
0
|
|
|
|
|
if (!$count) { $count=0; } |
|
0
|
|
|
|
|
|
|
642
|
0
|
|
|
|
|
|
BASE: for (; $count < $total_bases; $count++) { |
643
|
0
|
|
|
|
|
|
for($count2 = $count; $count2 < $count+$windowsize; $count2++) { |
644
|
0
|
0
|
|
|
|
|
if ($count2 == scalar(@quals)-1) { |
645
|
0
|
|
|
|
|
|
$qualsum += $quals[$count2]; |
646
|
0
|
|
|
|
|
|
$end_of_quals = 1; |
647
|
0
|
|
|
|
|
|
last BASE; |
648
|
|
|
|
|
|
|
|
649
|
|
|
|
|
|
|
} |
650
|
0
|
|
|
|
|
|
$qualsum += $quals[$count2]; |
651
|
|
|
|
|
|
|
} |
652
|
0
|
0
|
|
|
|
|
if ($qualsum < $windowsize*$phreds) { |
653
|
0
|
|
|
|
|
|
return $count+$windowsize; |
654
|
|
|
|
|
|
|
} |
655
|
0
|
|
|
|
|
|
$qualsum = 0; |
656
|
|
|
|
|
|
|
} # end for |
657
|
|
|
|
|
|
|
} # end get_end_old |
658
|
|
|
|
|
|
|
|
659
|
|
|
|
|
|
|
|
660
|
|
|
|
|
|
|
# Autoload methods go after =cut, and are processed by the autosplit program. |
661
|
|
|
|
|
|
|
|
662
|
|
|
|
|
|
|
1; |
663
|
|
|
|
|
|
|
__END__ |