line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
# |
2
|
|
|
|
|
|
|
# BioPerl module for Bio::Seq::SequenceTrace |
3
|
|
|
|
|
|
|
# |
4
|
|
|
|
|
|
|
# Please direct questions and support issues to |
5
|
|
|
|
|
|
|
# |
6
|
|
|
|
|
|
|
# Cared for by Chad Matsalla
|
7
|
|
|
|
|
|
|
# |
8
|
|
|
|
|
|
|
# Copyright Chad Matsalla |
9
|
|
|
|
|
|
|
# |
10
|
|
|
|
|
|
|
# You may distribute this module under the same terms as perl itself |
11
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
# POD documentation - main docs before the code |
13
|
|
|
|
|
|
|
|
14
|
|
|
|
|
|
|
=head1 NAME |
15
|
|
|
|
|
|
|
|
16
|
|
|
|
|
|
|
Bio::Seq::SequenceTrace - Bioperl object packaging a sequence with its trace |
17
|
|
|
|
|
|
|
|
18
|
|
|
|
|
|
|
=head1 SYNOPSIS |
19
|
|
|
|
|
|
|
|
20
|
|
|
|
|
|
|
# example code here |
21
|
|
|
|
|
|
|
|
22
|
|
|
|
|
|
|
=head1 DESCRIPTION |
23
|
|
|
|
|
|
|
|
24
|
|
|
|
|
|
|
This object stores a sequence with its trace. |
25
|
|
|
|
|
|
|
|
26
|
|
|
|
|
|
|
=head1 FEEDBACK |
27
|
|
|
|
|
|
|
|
28
|
|
|
|
|
|
|
=head2 Mailing Lists |
29
|
|
|
|
|
|
|
|
30
|
|
|
|
|
|
|
User feedback is an integral part of the evolution of this and other |
31
|
|
|
|
|
|
|
Bioperl modules. Send your comments and suggestions preferably to one |
32
|
|
|
|
|
|
|
of the Bioperl mailing lists. Your participation is much appreciated. |
33
|
|
|
|
|
|
|
|
34
|
|
|
|
|
|
|
bioperl-l@bioperl.org - General discussion |
35
|
|
|
|
|
|
|
http://bioperl.org/wiki/Mailing_lists - About the mailing lists |
36
|
|
|
|
|
|
|
|
37
|
|
|
|
|
|
|
=head2 Support |
38
|
|
|
|
|
|
|
|
39
|
|
|
|
|
|
|
Please direct usage questions or support issues to the mailing list: |
40
|
|
|
|
|
|
|
|
41
|
|
|
|
|
|
|
I |
42
|
|
|
|
|
|
|
|
43
|
|
|
|
|
|
|
rather than to the module maintainer directly. Many experienced and |
44
|
|
|
|
|
|
|
reponsive experts will be able look at the problem and quickly |
45
|
|
|
|
|
|
|
address it. Please include a thorough description of the problem |
46
|
|
|
|
|
|
|
with code and data examples if at all possible. |
47
|
|
|
|
|
|
|
|
48
|
|
|
|
|
|
|
=head2 Reporting Bugs |
49
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
Report bugs to the Bioperl bug tracking system to help us keep track |
51
|
|
|
|
|
|
|
the bugs and their resolution. Bug reports can be submitted via the |
52
|
|
|
|
|
|
|
web: |
53
|
|
|
|
|
|
|
|
54
|
|
|
|
|
|
|
https://github.com/bioperl/bioperl-live/issues |
55
|
|
|
|
|
|
|
|
56
|
|
|
|
|
|
|
=head1 AUTHOR - Chad Matsalla |
57
|
|
|
|
|
|
|
|
58
|
|
|
|
|
|
|
Email bioinformatics@dieselwurks.com |
59
|
|
|
|
|
|
|
|
60
|
|
|
|
|
|
|
|
61
|
|
|
|
|
|
|
The rest of the documentation details each of the object methods. |
62
|
|
|
|
|
|
|
Internal methods are usually preceded with a _ |
63
|
|
|
|
|
|
|
|
64
|
|
|
|
|
|
|
=cut |
65
|
|
|
|
|
|
|
|
66
|
|
|
|
|
|
|
|
67
|
|
|
|
|
|
|
package Bio::Seq::SequenceTrace; |
68
|
|
|
|
|
|
|
|
69
|
|
|
|
|
|
|
|
70
|
1
|
|
|
1
|
|
3
|
use strict; |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
23
|
|
71
|
1
|
|
|
1
|
|
257
|
use Bio::Seq::QualI; |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
18
|
|
72
|
1
|
|
|
1
|
|
297
|
use Bio::PrimarySeqI; |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
24
|
|
73
|
1
|
|
|
1
|
|
465
|
use Bio::PrimarySeq; |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
23
|
|
74
|
1
|
|
|
1
|
|
283
|
use Bio::Seq::PrimaryQual; |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
25
|
|
75
|
|
|
|
|
|
|
|
76
|
1
|
|
|
1
|
|
5
|
use base qw(Bio::Root::Root Bio::Seq::Quality Bio::Seq::TraceI); |
|
1
|
|
|
|
|
1
|
|
|
1
|
|
|
|
|
343
|
|
77
|
|
|
|
|
|
|
|
78
|
|
|
|
|
|
|
=head2 new() |
79
|
|
|
|
|
|
|
|
80
|
|
|
|
|
|
|
Title : new() |
81
|
|
|
|
|
|
|
Usage : $st = Bio::Seq::SequenceTrace->new |
82
|
|
|
|
|
|
|
( -swq => Bio::Seq::SequenceWithQuality, |
83
|
|
|
|
|
|
|
-trace_a => \@trace_values_for_a_channel, |
84
|
|
|
|
|
|
|
-trace_t => \@trace_values_for_t_channel, |
85
|
|
|
|
|
|
|
-trace_g => \@trace_values_for_g_channel, |
86
|
|
|
|
|
|
|
-trace_c => \@trace_values_for_c_channel, |
87
|
|
|
|
|
|
|
-accuracy_a => \@a_accuracies, |
88
|
|
|
|
|
|
|
-accuracy_t => \@t_accuracies, |
89
|
|
|
|
|
|
|
-accuracy_g => \@g_accuracies, |
90
|
|
|
|
|
|
|
-accuracy_c => \@c_accuracies, |
91
|
|
|
|
|
|
|
-peak_indices => '0 5 10 15 20 25 30 35' |
92
|
|
|
|
|
|
|
); |
93
|
|
|
|
|
|
|
Function: Returns a new Bio::Seq::SequenceTrace object from basic |
94
|
|
|
|
|
|
|
constructors. |
95
|
|
|
|
|
|
|
Returns : a new Bio::Seq::SequenceTrace object |
96
|
|
|
|
|
|
|
Arguments: I think that these are all describes in the usage above. |
97
|
|
|
|
|
|
|
|
98
|
|
|
|
|
|
|
=cut |
99
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
sub new { |
101
|
20
|
|
|
20
|
1
|
86
|
my ($class, @args) = @_; |
102
|
20
|
|
|
|
|
71
|
my $self = $class->SUPER::new(@args); |
103
|
|
|
|
|
|
|
# default: turn OFF the warnings |
104
|
20
|
|
|
|
|
36
|
$self->{supress_warnings} = 1; |
105
|
20
|
|
|
|
|
155
|
my($swq,$peak_indices,$trace_a,$trace_t, |
106
|
|
|
|
|
|
|
$trace_g,$trace_c,$acc_a,$acc_t,$acc_g,$acc_c) = |
107
|
|
|
|
|
|
|
$self->_rearrange([qw( |
108
|
|
|
|
|
|
|
SWQ |
109
|
|
|
|
|
|
|
PEAK_INDICES |
110
|
|
|
|
|
|
|
TRACE_A |
111
|
|
|
|
|
|
|
TRACE_T |
112
|
|
|
|
|
|
|
TRACE_G |
113
|
|
|
|
|
|
|
TRACE_C |
114
|
|
|
|
|
|
|
ACCURACY_A |
115
|
|
|
|
|
|
|
ACCURACY_T |
116
|
|
|
|
|
|
|
ACCURACY_G |
117
|
|
|
|
|
|
|
ACCURACY_C )], @args); |
118
|
|
|
|
|
|
|
# first, deal with the sequence and quality information |
119
|
20
|
50
|
33
|
|
|
131
|
if ($swq && ref($swq) eq "Bio::Seq::Quality") { |
120
|
20
|
|
|
|
|
45
|
$self->{swq} = $swq; |
121
|
|
|
|
|
|
|
} |
122
|
|
|
|
|
|
|
else { |
123
|
0
|
|
|
|
|
0
|
$self->throw("A Bio::Seq::SequenceTrace object must be created with a |
124
|
|
|
|
|
|
|
Bio::Seq::Quality object. You provided this type of object: " |
125
|
|
|
|
|
|
|
.ref($swq)); |
126
|
|
|
|
|
|
|
} |
127
|
20
|
100
|
|
|
|
43
|
if (!$acc_a) { |
128
|
|
|
|
|
|
|
# this means that you probably did not provide traces and accuracies |
129
|
|
|
|
|
|
|
# and that they need to be synthesized |
130
|
5
|
|
|
|
|
19
|
$self->set_accuracies(); |
131
|
|
|
|
|
|
|
} |
132
|
|
|
|
|
|
|
else { |
133
|
15
|
|
|
|
|
69
|
$self->accuracies('a',$acc_a); |
134
|
15
|
|
|
|
|
39
|
$self->accuracies('t',$acc_t); |
135
|
15
|
|
|
|
|
27
|
$self->accuracies('g',$acc_g); |
136
|
15
|
|
|
|
|
40
|
$self->accuracies('c',$acc_c); |
137
|
|
|
|
|
|
|
} |
138
|
20
|
100
|
|
|
|
40
|
if (!$trace_a) { |
139
|
3
|
|
|
|
|
12
|
$self->_synthesize_traces(); |
140
|
|
|
|
|
|
|
} |
141
|
|
|
|
|
|
|
else { |
142
|
17
|
|
|
|
|
45
|
$self->trace('a',$trace_a); |
143
|
17
|
|
|
|
|
41
|
$self->trace('t',$trace_t); |
144
|
17
|
|
|
|
|
45
|
$self->trace('g',$trace_g); |
145
|
17
|
|
|
|
|
40
|
$self->trace('c',$trace_c); |
146
|
17
|
|
|
|
|
54
|
$self->peak_indices($peak_indices); |
147
|
|
|
|
|
|
|
} |
148
|
20
|
|
|
|
|
72
|
$self->id($self->seq_obj->id); |
149
|
20
|
|
|
|
|
111
|
return $self; |
150
|
|
|
|
|
|
|
} |
151
|
|
|
|
|
|
|
|
152
|
|
|
|
|
|
|
sub swq_obj { |
153
|
0
|
|
|
0
|
0
|
0
|
my $self = shift; |
154
|
0
|
|
|
|
|
0
|
$self->warn('swq_obj() is deprecated: use seq_obj()'); |
155
|
0
|
|
|
|
|
0
|
return $self->{swq}; |
156
|
|
|
|
|
|
|
} |
157
|
|
|
|
|
|
|
|
158
|
|
|
|
|
|
|
|
159
|
|
|
|
|
|
|
|
160
|
|
|
|
|
|
|
=head2 trace($base,\@new_values) |
161
|
|
|
|
|
|
|
|
162
|
|
|
|
|
|
|
Title : trace($base,\@new_values) |
163
|
|
|
|
|
|
|
Usage : @trace_Values = @{$obj->trace($base,\@new_values)}; |
164
|
|
|
|
|
|
|
Function: Returns the trace values as a reference to an array containing the |
165
|
|
|
|
|
|
|
trace values. The individual elements of the trace array are not validated |
166
|
|
|
|
|
|
|
and can be any numeric value. |
167
|
|
|
|
|
|
|
Returns : A reference to an array. |
168
|
|
|
|
|
|
|
Status : |
169
|
|
|
|
|
|
|
Arguments: $base : which color channel would you like the trace values for? |
170
|
|
|
|
|
|
|
- $base must be one of "A","T","G","C" |
171
|
|
|
|
|
|
|
\@new_values : a reference to an array of values containing trace |
172
|
|
|
|
|
|
|
data for this base |
173
|
|
|
|
|
|
|
|
174
|
|
|
|
|
|
|
=cut |
175
|
|
|
|
|
|
|
|
176
|
|
|
|
|
|
|
sub trace { |
177
|
518822
|
|
|
518822
|
1
|
376849
|
my ($self,$base_channel,$values) = @_; |
178
|
518822
|
50
|
|
|
|
544959
|
if (!$base_channel) { |
179
|
0
|
|
|
|
|
0
|
$self->throw('You must provide a valid base channel (atgc) to use trace()'); |
180
|
|
|
|
|
|
|
} |
181
|
518822
|
|
|
|
|
368183
|
$base_channel =~ tr/A-Z/a-z/; |
182
|
518822
|
50
|
|
|
|
835739
|
if ($base_channel !~ /[acgt]/) { |
183
|
0
|
|
|
|
|
0
|
$self->throw('You must provide a valid base channel (atgc) to use trace()'); |
184
|
|
|
|
|
|
|
} |
185
|
518822
|
100
|
|
|
|
572416
|
if ($values) { |
186
|
84
|
100
|
|
|
|
143
|
if (ref($values) eq "ARRAY") { |
187
|
40
|
|
|
|
|
65
|
$self->{trace}->{$base_channel} = $values; |
188
|
|
|
|
|
|
|
} |
189
|
|
|
|
|
|
|
else { |
190
|
44
|
|
|
|
|
46608
|
my @trace = split(' ',$values); |
191
|
44
|
|
|
|
|
177
|
$self->{trace}->{$base_channel} = \@trace; |
192
|
|
|
|
|
|
|
} |
193
|
|
|
|
|
|
|
} |
194
|
518822
|
50
|
|
|
|
551281
|
if ($self->{trace}->{$base_channel}) { |
195
|
518822
|
|
|
|
|
792483
|
return $self->{trace}->{$base_channel}; |
196
|
|
|
|
|
|
|
} |
197
|
|
|
|
|
|
|
else { |
198
|
0
|
|
|
|
|
0
|
return; |
199
|
|
|
|
|
|
|
} |
200
|
|
|
|
|
|
|
} |
201
|
|
|
|
|
|
|
|
202
|
|
|
|
|
|
|
|
203
|
|
|
|
|
|
|
=head2 peak_indices($new_indices) |
204
|
|
|
|
|
|
|
|
205
|
|
|
|
|
|
|
Title : peak_indices($new_indices) |
206
|
|
|
|
|
|
|
Usage : $indices = $obj->peak_indices($new_indices); |
207
|
|
|
|
|
|
|
Function: Return the trace index points for this object. |
208
|
|
|
|
|
|
|
Returns : A scalar |
209
|
|
|
|
|
|
|
Args : If used, the trace indices will be set to the provided value. |
210
|
|
|
|
|
|
|
|
211
|
|
|
|
|
|
|
=cut |
212
|
|
|
|
|
|
|
|
213
|
|
|
|
|
|
|
sub peak_indices { |
214
|
1539
|
|
|
1539
|
1
|
2419
|
my ($self,$peak_indices)= @_; |
215
|
1539
|
100
|
|
|
|
1732
|
if ($peak_indices) { |
216
|
17
|
100
|
|
|
|
40
|
if (ref($peak_indices) eq "ARRAY") { |
217
|
6
|
|
|
|
|
13
|
$self->{peak_indices} = $peak_indices; |
218
|
|
|
|
|
|
|
} |
219
|
|
|
|
|
|
|
else { |
220
|
11
|
|
|
|
|
752
|
my @indices = split(' ',$peak_indices); |
221
|
11
|
|
|
|
|
23
|
$self->{peak_indices} = \@indices; |
222
|
|
|
|
|
|
|
} |
223
|
|
|
|
|
|
|
} |
224
|
1539
|
100
|
|
|
|
1909
|
if (!$self->{peak_indices}) { |
225
|
3
|
|
|
|
|
6
|
my @temp = (); |
226
|
3
|
|
|
|
|
7
|
$self->{peak_indices} = \@temp; |
227
|
|
|
|
|
|
|
} |
228
|
1539
|
|
|
|
|
2514
|
return $self->{peak_indices}; |
229
|
|
|
|
|
|
|
} |
230
|
|
|
|
|
|
|
|
231
|
|
|
|
|
|
|
|
232
|
|
|
|
|
|
|
=head2 _reset_peak_indices() |
233
|
|
|
|
|
|
|
|
234
|
|
|
|
|
|
|
Title : _rest_peak_indices() |
235
|
|
|
|
|
|
|
Usage : $obj->_reset_peak_indices(); |
236
|
|
|
|
|
|
|
Function: Reset the peak indices. |
237
|
|
|
|
|
|
|
Returns : Nothing. |
238
|
|
|
|
|
|
|
Args : None. |
239
|
|
|
|
|
|
|
Notes : When you create a sub_trace_object, the peak indices |
240
|
|
|
|
|
|
|
will still be pointing to the apporpriate location _in the |
241
|
|
|
|
|
|
|
original trace_. In order to fix this, the initial value must |
242
|
|
|
|
|
|
|
be subtracted from each value here. ie. The first peak index |
243
|
|
|
|
|
|
|
must be "1". |
244
|
|
|
|
|
|
|
|
245
|
|
|
|
|
|
|
=cut |
246
|
|
|
|
|
|
|
|
247
|
|
|
|
|
|
|
sub _reset_peak_indices { |
248
|
2
|
|
|
2
|
|
4
|
my $self = shift; |
249
|
2
|
|
|
|
|
6
|
my $length = $self->length(); |
250
|
2
|
|
|
|
|
7
|
my $subtractive = $self->peak_index_at(1); |
251
|
2
|
|
|
|
|
3
|
my ($original,$new); |
252
|
2
|
|
|
|
|
5
|
$self->peak_index_at(1,"null"); |
253
|
2
|
|
|
|
|
7
|
for (my $counter=2; $counter<= $length; $counter++) { |
254
|
49
|
|
|
|
|
49
|
my $original = $self->peak_index_at($counter); |
255
|
49
|
|
|
|
|
48
|
$new = $original - $subtractive; |
256
|
49
|
|
|
|
|
48
|
$self->peak_index_at($counter,$new); |
257
|
|
|
|
|
|
|
} |
258
|
2
|
|
|
|
|
3
|
return; |
259
|
|
|
|
|
|
|
} |
260
|
|
|
|
|
|
|
|
261
|
|
|
|
|
|
|
|
262
|
|
|
|
|
|
|
|
263
|
|
|
|
|
|
|
|
264
|
|
|
|
|
|
|
|
265
|
|
|
|
|
|
|
=head2 peak_index_at($position) |
266
|
|
|
|
|
|
|
|
267
|
|
|
|
|
|
|
Title : peak_index_at($position) |
268
|
|
|
|
|
|
|
Usage : $peak_index = $obj->peak_index_at($postition); |
269
|
|
|
|
|
|
|
Function: Return the trace iindex point at this position |
270
|
|
|
|
|
|
|
Returns : A scalar |
271
|
|
|
|
|
|
|
Args : If used, the trace index at this position will be |
272
|
|
|
|
|
|
|
set to the provided value. |
273
|
|
|
|
|
|
|
|
274
|
|
|
|
|
|
|
=cut |
275
|
|
|
|
|
|
|
|
276
|
|
|
|
|
|
|
sub peak_index_at { |
277
|
1291
|
|
|
1291
|
1
|
1376
|
my ($self,$position,$value)= @_; |
278
|
1291
|
100
|
|
|
|
1486
|
if ($value) { |
279
|
133
|
100
|
|
|
|
156
|
if ($value eq "null") { |
280
|
2
|
|
|
|
|
4
|
$self->peak_indices->[$position-1] = "0"; |
281
|
|
|
|
|
|
|
} |
282
|
|
|
|
|
|
|
else { |
283
|
131
|
|
|
|
|
137
|
$self->peak_indices->[$position-1] = $value; |
284
|
|
|
|
|
|
|
} |
285
|
|
|
|
|
|
|
} |
286
|
1291
|
|
|
|
|
1234
|
return $self->peak_indices()->[$position-1]; |
287
|
|
|
|
|
|
|
} |
288
|
|
|
|
|
|
|
|
289
|
|
|
|
|
|
|
=head2 alphabet() |
290
|
|
|
|
|
|
|
|
291
|
|
|
|
|
|
|
Title : alphabet(); |
292
|
|
|
|
|
|
|
Usage : $molecule_type = $obj->alphabet(); |
293
|
|
|
|
|
|
|
Function: Get the molecule type from the PrimarySeq object. |
294
|
|
|
|
|
|
|
Returns : What what PrimarySeq says the type of the sequence is. |
295
|
|
|
|
|
|
|
Args : None. |
296
|
|
|
|
|
|
|
|
297
|
|
|
|
|
|
|
=cut |
298
|
|
|
|
|
|
|
|
299
|
|
|
|
|
|
|
sub alphabet { |
300
|
1
|
|
|
1
|
1
|
2
|
my $self = shift; |
301
|
1
|
|
|
|
|
4
|
return $self->{swq}->alphabet; |
302
|
|
|
|
|
|
|
} |
303
|
|
|
|
|
|
|
|
304
|
|
|
|
|
|
|
=head2 display_id() |
305
|
|
|
|
|
|
|
|
306
|
|
|
|
|
|
|
Title : display_id() |
307
|
|
|
|
|
|
|
Usage : $id_string = $obj->display_id(); |
308
|
|
|
|
|
|
|
Function: Returns the display id, aka the common name of the Quality |
309
|
|
|
|
|
|
|
object. |
310
|
|
|
|
|
|
|
The semantics of this is that it is the most likely string to be |
311
|
|
|
|
|
|
|
used as an identifier of the quality sequence, and likely to have |
312
|
|
|
|
|
|
|
"human" readability. The id is equivalent to the ID field of the |
313
|
|
|
|
|
|
|
GenBank/EMBL databanks and the id field of the Swissprot/sptrembl |
314
|
|
|
|
|
|
|
database. In fasta format, the >(\S+) is presumed to be the id, |
315
|
|
|
|
|
|
|
though some people overload the id to embed other information. |
316
|
|
|
|
|
|
|
Bioperl does not use any embedded information in the ID field, |
317
|
|
|
|
|
|
|
and people are encouraged to use other mechanisms (accession |
318
|
|
|
|
|
|
|
field for example, or extending the sequence object) to solve |
319
|
|
|
|
|
|
|
this. Notice that $seq->id() maps to this function, mainly for |
320
|
|
|
|
|
|
|
legacy/convience issues. |
321
|
|
|
|
|
|
|
This method sets the display_id for the Quality object. |
322
|
|
|
|
|
|
|
Returns : A string |
323
|
|
|
|
|
|
|
Args : If a scalar is provided, it is set as the new display_id for |
324
|
|
|
|
|
|
|
the Quality object. |
325
|
|
|
|
|
|
|
Status : Virtual |
326
|
|
|
|
|
|
|
|
327
|
|
|
|
|
|
|
=cut |
328
|
|
|
|
|
|
|
|
329
|
|
|
|
|
|
|
sub display_id { |
330
|
11
|
|
|
11
|
1
|
3043
|
my ($self,$value) = @_; |
331
|
11
|
50
|
|
|
|
23
|
if( defined $value) { |
332
|
0
|
|
|
|
|
0
|
$self->{swq}->display_id($value); |
333
|
|
|
|
|
|
|
} |
334
|
11
|
|
|
|
|
28
|
return $self->{swq}->display_id(); |
335
|
|
|
|
|
|
|
|
336
|
|
|
|
|
|
|
} |
337
|
|
|
|
|
|
|
|
338
|
|
|
|
|
|
|
=head2 accession_number() |
339
|
|
|
|
|
|
|
|
340
|
|
|
|
|
|
|
Title : accession_number() |
341
|
|
|
|
|
|
|
Usage : $unique_biological_key = $obj->accession_number(); |
342
|
|
|
|
|
|
|
Function: Returns the unique biological id for a sequence, commonly |
343
|
|
|
|
|
|
|
called the accession_number. For sequences from established |
344
|
|
|
|
|
|
|
databases, the implementors should try to use the correct |
345
|
|
|
|
|
|
|
accession number. Notice that primary_id() provides the unique id |
346
|
|
|
|
|
|
|
for the implemetation, allowing multiple objects to have the same |
347
|
|
|
|
|
|
|
accession number in a particular implementation. For sequences |
348
|
|
|
|
|
|
|
with no accession number, this method should return "unknown". |
349
|
|
|
|
|
|
|
This method sets the accession_number for the Quality |
350
|
|
|
|
|
|
|
object. |
351
|
|
|
|
|
|
|
Returns : A string (the value of accession_number) |
352
|
|
|
|
|
|
|
Args : If a scalar is provided, it is set as the new accession_number |
353
|
|
|
|
|
|
|
for the Quality object. |
354
|
|
|
|
|
|
|
Status : Virtual |
355
|
|
|
|
|
|
|
|
356
|
|
|
|
|
|
|
|
357
|
|
|
|
|
|
|
=cut |
358
|
|
|
|
|
|
|
|
359
|
|
|
|
|
|
|
sub accession_number { |
360
|
1
|
|
|
1
|
1
|
2
|
my( $self, $acc ) = @_; |
361
|
1
|
50
|
|
|
|
4
|
if (defined $acc) { |
362
|
0
|
|
|
|
|
0
|
$self->{swq}->accession_number($acc); |
363
|
|
|
|
|
|
|
} else { |
364
|
1
|
|
|
|
|
11
|
$acc = $self->{swq}->accession_number(); |
365
|
1
|
50
|
|
|
|
4
|
$acc = 'unknown' unless defined $acc; |
366
|
|
|
|
|
|
|
} |
367
|
1
|
|
|
|
|
3
|
return $acc; |
368
|
|
|
|
|
|
|
} |
369
|
|
|
|
|
|
|
|
370
|
|
|
|
|
|
|
=head2 primary_id() |
371
|
|
|
|
|
|
|
|
372
|
|
|
|
|
|
|
Title : primary_id() |
373
|
|
|
|
|
|
|
Usage : $unique_implementation_key = $obj->primary_id(); |
374
|
|
|
|
|
|
|
Function: Returns the unique id for this object in this implementation. |
375
|
|
|
|
|
|
|
This allows implementations to manage their own object ids in a |
376
|
|
|
|
|
|
|
way the implementaiton can control clients can expect one id to |
377
|
|
|
|
|
|
|
map to one object. For sequences with no accession number, this |
378
|
|
|
|
|
|
|
method should return a stringified memory location. |
379
|
|
|
|
|
|
|
This method sets the primary_id for the Quality |
380
|
|
|
|
|
|
|
object. |
381
|
|
|
|
|
|
|
Returns : A string. (the value of primary_id) |
382
|
|
|
|
|
|
|
Args : If a scalar is provided, it is set as the new primary_id for |
383
|
|
|
|
|
|
|
the Quality object. |
384
|
|
|
|
|
|
|
|
385
|
|
|
|
|
|
|
=cut |
386
|
|
|
|
|
|
|
|
387
|
|
|
|
|
|
|
sub primary_id { |
388
|
2
|
|
|
2
|
1
|
4
|
my ($self,$value) = @_; |
389
|
2
|
100
|
|
|
|
7
|
if ($value) { |
390
|
1
|
|
|
|
|
4
|
$self->{swq}->primary_id($value); |
391
|
|
|
|
|
|
|
} |
392
|
2
|
|
|
|
|
13
|
return $self->{swq}->primary_id(); |
393
|
|
|
|
|
|
|
|
394
|
|
|
|
|
|
|
} |
395
|
|
|
|
|
|
|
|
396
|
|
|
|
|
|
|
=head2 desc() |
397
|
|
|
|
|
|
|
|
398
|
|
|
|
|
|
|
Title : desc() |
399
|
|
|
|
|
|
|
Usage : $qual->desc($newval); _or_ |
400
|
|
|
|
|
|
|
$description = $qual->desc(); |
401
|
|
|
|
|
|
|
Function: Get/set description text for this Quality object. |
402
|
|
|
|
|
|
|
Returns : A string. (the value of desc) |
403
|
|
|
|
|
|
|
Args : If a scalar is provided, it is set as the new desc for the |
404
|
|
|
|
|
|
|
Quality object. |
405
|
|
|
|
|
|
|
|
406
|
|
|
|
|
|
|
=cut |
407
|
|
|
|
|
|
|
|
408
|
|
|
|
|
|
|
sub desc { |
409
|
|
|
|
|
|
|
# a mechanism to set the desc for the Quality object. |
410
|
|
|
|
|
|
|
# probably will be used most often by set_common_features() |
411
|
2
|
|
|
2
|
1
|
4
|
my ($self,$value) = @_; |
412
|
2
|
100
|
|
|
|
7
|
if( defined $value) { |
413
|
1
|
|
|
|
|
6
|
$self->{swq}->desc($value); |
414
|
|
|
|
|
|
|
} |
415
|
2
|
|
|
|
|
10
|
return $self->{swq}->desc(); |
416
|
|
|
|
|
|
|
} |
417
|
|
|
|
|
|
|
|
418
|
|
|
|
|
|
|
=head2 id() |
419
|
|
|
|
|
|
|
|
420
|
|
|
|
|
|
|
Title : id() |
421
|
|
|
|
|
|
|
Usage : $id = $qual->id(); |
422
|
|
|
|
|
|
|
Function: Return the ID of the quality. This should normally be (and |
423
|
|
|
|
|
|
|
actually is in the implementation provided here) just a synonym |
424
|
|
|
|
|
|
|
for display_id(). |
425
|
|
|
|
|
|
|
Returns : A string. (the value of id) |
426
|
|
|
|
|
|
|
Args : If a scalar is provided, it is set as the new id for the |
427
|
|
|
|
|
|
|
Quality object. |
428
|
|
|
|
|
|
|
|
429
|
|
|
|
|
|
|
=cut |
430
|
|
|
|
|
|
|
|
431
|
|
|
|
|
|
|
sub id { |
432
|
36
|
|
|
36
|
1
|
451
|
my ($self,$value) = @_; |
433
|
36
|
50
|
|
|
|
72
|
if (!$self) { $self->throw("no value for self in $value"); } |
|
0
|
|
|
|
|
0
|
|
434
|
36
|
100
|
|
|
|
72
|
if( defined $value ) { |
435
|
10
|
|
|
|
|
29
|
$self->{swq}->display_id($value); |
436
|
|
|
|
|
|
|
} |
437
|
36
|
|
|
|
|
105
|
return $self->{swq}->display_id(); |
438
|
|
|
|
|
|
|
} |
439
|
|
|
|
|
|
|
|
440
|
|
|
|
|
|
|
=head2 seq |
441
|
|
|
|
|
|
|
|
442
|
|
|
|
|
|
|
Title : seq() |
443
|
|
|
|
|
|
|
Usage : $string = $obj->seq(); _or_ |
444
|
|
|
|
|
|
|
$obj->seq("atctatcatca"); |
445
|
|
|
|
|
|
|
Function: Returns the sequence that is contained in the imbedded in the |
446
|
|
|
|
|
|
|
PrimarySeq object within the Quality object |
447
|
|
|
|
|
|
|
Returns : A scalar (the seq() value for the imbedded PrimarySeq object.) |
448
|
|
|
|
|
|
|
Args : If a scalar is provided, the Quality object will |
449
|
|
|
|
|
|
|
attempt to set that as the sequence for the imbedded PrimarySeq |
450
|
|
|
|
|
|
|
object. Otherwise, the value of seq() for the PrimarySeq object |
451
|
|
|
|
|
|
|
is returned. |
452
|
|
|
|
|
|
|
Notes : This is probably not a good idea because you then should call |
453
|
|
|
|
|
|
|
length() to make sure that the sequence and quality are of the |
454
|
|
|
|
|
|
|
same length. Even then, how can you make sure that this sequence |
455
|
|
|
|
|
|
|
belongs with that quality? I provided this to give you rope to |
456
|
|
|
|
|
|
|
hang yourself with. Tie it to a strong device and use a good |
457
|
|
|
|
|
|
|
knot. |
458
|
|
|
|
|
|
|
|
459
|
|
|
|
|
|
|
=cut |
460
|
|
|
|
|
|
|
|
461
|
|
|
|
|
|
|
sub seq { |
462
|
49
|
|
|
49
|
1
|
796
|
my ($self,$value) = @_; |
463
|
49
|
50
|
|
|
|
108
|
if( defined $value) { |
464
|
0
|
|
|
|
|
0
|
$self->{swq}->seq($value); |
465
|
|
|
|
|
|
|
} |
466
|
49
|
|
|
|
|
122
|
return $self->{swq}->seq(); |
467
|
|
|
|
|
|
|
} |
468
|
|
|
|
|
|
|
|
469
|
|
|
|
|
|
|
=head2 qual() |
470
|
|
|
|
|
|
|
|
471
|
|
|
|
|
|
|
Title : qual() |
472
|
|
|
|
|
|
|
Usage : @quality_values = @{$obj->qual()}; _or_ |
473
|
|
|
|
|
|
|
$obj->qual("10 10 20 40 50"); |
474
|
|
|
|
|
|
|
Function: Returns the quality as imbedded in the PrimaryQual object |
475
|
|
|
|
|
|
|
within the Quality object. |
476
|
|
|
|
|
|
|
Returns : A reference to an array containing the quality values in the |
477
|
|
|
|
|
|
|
PrimaryQual object. |
478
|
|
|
|
|
|
|
Args : If a scalar is provided, the Quality object will |
479
|
|
|
|
|
|
|
attempt to set that as the quality for the imbedded PrimaryQual |
480
|
|
|
|
|
|
|
object. Otherwise, the value of qual() for the PrimaryQual |
481
|
|
|
|
|
|
|
object is returned. |
482
|
|
|
|
|
|
|
Notes : This is probably not a good idea because you then should call |
483
|
|
|
|
|
|
|
length() to make sure that the sequence and quality are of the |
484
|
|
|
|
|
|
|
same length. Even then, how can you make sure that this sequence |
485
|
|
|
|
|
|
|
belongs with that quality? I provided this to give you a strong |
486
|
|
|
|
|
|
|
board with which to flagellate yourself. |
487
|
|
|
|
|
|
|
|
488
|
|
|
|
|
|
|
=cut |
489
|
|
|
|
|
|
|
|
490
|
|
|
|
|
|
|
sub qual { |
491
|
9
|
|
|
9
|
1
|
4893
|
my ($self,$value) = @_; |
492
|
|
|
|
|
|
|
|
493
|
9
|
50
|
|
|
|
16
|
if( defined $value) { |
494
|
0
|
|
|
|
|
0
|
$self->{swq}->qual($value); |
495
|
|
|
|
|
|
|
} |
496
|
9
|
|
|
|
|
27
|
return $self->{swq}->qual(); |
497
|
|
|
|
|
|
|
} |
498
|
|
|
|
|
|
|
|
499
|
|
|
|
|
|
|
|
500
|
|
|
|
|
|
|
|
501
|
|
|
|
|
|
|
|
502
|
|
|
|
|
|
|
=head2 length() |
503
|
|
|
|
|
|
|
|
504
|
|
|
|
|
|
|
Title : length() |
505
|
|
|
|
|
|
|
Usage : $length = $seqWqual->length(); |
506
|
|
|
|
|
|
|
Function: Get the length of the Quality sequence/quality. |
507
|
|
|
|
|
|
|
Returns : Returns the length of the sequence and quality |
508
|
|
|
|
|
|
|
Args : None. |
509
|
|
|
|
|
|
|
|
510
|
|
|
|
|
|
|
=cut |
511
|
|
|
|
|
|
|
|
512
|
|
|
|
|
|
|
sub length { |
513
|
123
|
|
|
123
|
1
|
122
|
my $self = shift; |
514
|
123
|
|
|
|
|
192
|
return $self->seq_obj->length; |
515
|
|
|
|
|
|
|
} |
516
|
|
|
|
|
|
|
|
517
|
|
|
|
|
|
|
|
518
|
|
|
|
|
|
|
=head2 qual_obj |
519
|
|
|
|
|
|
|
|
520
|
|
|
|
|
|
|
Title : qual_obj($different_obj) |
521
|
|
|
|
|
|
|
Usage : $qualobj = $seqWqual->qual_obj(); _or_ |
522
|
|
|
|
|
|
|
$qualobj = $seqWqual->qual_obj($ref_to_primaryqual_obj); |
523
|
|
|
|
|
|
|
Function: Get the Qualilty object that is imbedded in the |
524
|
|
|
|
|
|
|
Quality object or if a reference to a PrimaryQual object |
525
|
|
|
|
|
|
|
is provided, set this as the PrimaryQual object imbedded in the |
526
|
|
|
|
|
|
|
Quality object. |
527
|
|
|
|
|
|
|
Returns : A reference to a Bio::Seq::Quality object. |
528
|
|
|
|
|
|
|
|
529
|
|
|
|
|
|
|
Identical to L. |
530
|
|
|
|
|
|
|
|
531
|
|
|
|
|
|
|
=cut |
532
|
|
|
|
|
|
|
|
533
|
|
|
|
|
|
|
sub qual_obj { |
534
|
267
|
|
|
267
|
1
|
212
|
my ($self,$value) = @_; |
535
|
|
|
|
|
|
|
# return $self->{swq}->qual_obj($value); |
536
|
267
|
|
|
|
|
471
|
return $self->{swq}; |
537
|
|
|
|
|
|
|
} |
538
|
|
|
|
|
|
|
|
539
|
|
|
|
|
|
|
|
540
|
|
|
|
|
|
|
=head2 seq_obj |
541
|
|
|
|
|
|
|
|
542
|
|
|
|
|
|
|
Title : seq_obj() |
543
|
|
|
|
|
|
|
Usage : $seqobj = $seqWqual->seq_obj(); _or_ |
544
|
|
|
|
|
|
|
$seqobj = $seqWqual->seq_obj($ref_to_primary_seq_obj); |
545
|
|
|
|
|
|
|
Function: Get the PrimarySeq object that is imbedded in the |
546
|
|
|
|
|
|
|
Quality object or if a reference to a PrimarySeq object is |
547
|
|
|
|
|
|
|
provided, set this as the PrimarySeq object imbedded in the |
548
|
|
|
|
|
|
|
Quality object. |
549
|
|
|
|
|
|
|
Returns : A reference to a Bio::PrimarySeq object. |
550
|
|
|
|
|
|
|
|
551
|
|
|
|
|
|
|
=cut |
552
|
|
|
|
|
|
|
|
553
|
|
|
|
|
|
|
sub seq_obj { |
554
|
427
|
|
|
427
|
1
|
849
|
my ($self,$value) = @_; |
555
|
427
|
|
|
|
|
970
|
return $self->{swq}; |
556
|
|
|
|
|
|
|
} |
557
|
|
|
|
|
|
|
|
558
|
|
|
|
|
|
|
=head2 _set_descriptors |
559
|
|
|
|
|
|
|
|
560
|
|
|
|
|
|
|
Title : _set_descriptors() |
561
|
|
|
|
|
|
|
Usage : $seqWqual->_qual_obj($qual,$seq,$id,$acc,$pid,$desc,$given_id, |
562
|
|
|
|
|
|
|
$alphabet); |
563
|
|
|
|
|
|
|
Function: Set the descriptors for the Quality object. Try to |
564
|
|
|
|
|
|
|
match the descriptors in the PrimarySeq object and in the |
565
|
|
|
|
|
|
|
PrimaryQual object if descriptors were not provided with |
566
|
|
|
|
|
|
|
construction. |
567
|
|
|
|
|
|
|
Returns : Nothing. |
568
|
|
|
|
|
|
|
Args : $qual,$seq,$id,$acc,$pid,$desc,$given_id,$alphabet as found |
569
|
|
|
|
|
|
|
in the new() method. |
570
|
|
|
|
|
|
|
Notes : Really only intended to be called by the new() method. If |
571
|
|
|
|
|
|
|
you want to invoke a similar function try |
572
|
|
|
|
|
|
|
set_common_descriptors(). |
573
|
|
|
|
|
|
|
|
574
|
|
|
|
|
|
|
=cut |
575
|
|
|
|
|
|
|
|
576
|
|
|
|
|
|
|
|
577
|
|
|
|
|
|
|
sub _set_descriptors { |
578
|
0
|
|
|
0
|
|
0
|
my ($self,$qual,$seq,$id,$acc,$pid,$desc,$given_id,$alphabet) = @_; |
579
|
0
|
|
|
|
|
0
|
$self->{swq}->_seq_descriptors($qual,$seq,$id,$acc,$pid, |
580
|
|
|
|
|
|
|
$desc,$given_id,$alphabet); |
581
|
|
|
|
|
|
|
} |
582
|
|
|
|
|
|
|
|
583
|
|
|
|
|
|
|
=head2 subseq($start,$end) |
584
|
|
|
|
|
|
|
|
585
|
|
|
|
|
|
|
Title : subseq($start,$end) |
586
|
|
|
|
|
|
|
Usage : $subsequence = $obj->subseq($start,$end); |
587
|
|
|
|
|
|
|
Function: Returns the subseq from start to end, where the first base |
588
|
|
|
|
|
|
|
is 1 and the number is inclusive, ie 1-2 are the first two |
589
|
|
|
|
|
|
|
bases of the sequence. |
590
|
|
|
|
|
|
|
Returns : A string. |
591
|
|
|
|
|
|
|
Args : Two positions. |
592
|
|
|
|
|
|
|
|
593
|
|
|
|
|
|
|
=cut |
594
|
|
|
|
|
|
|
|
595
|
|
|
|
|
|
|
sub subseq { |
596
|
3
|
|
|
3
|
1
|
9
|
my ($self,@args) = @_; |
597
|
|
|
|
|
|
|
# does a single value work? |
598
|
3
|
|
|
|
|
16
|
return $self->{swq}->subseq(@args); |
599
|
|
|
|
|
|
|
} |
600
|
|
|
|
|
|
|
|
601
|
|
|
|
|
|
|
=head2 baseat($position) |
602
|
|
|
|
|
|
|
|
603
|
|
|
|
|
|
|
Title : baseat($position) |
604
|
|
|
|
|
|
|
Usage : $base_at_position_6 = $obj->baseat("6"); |
605
|
|
|
|
|
|
|
Function: Returns a single base at the given position, where the first |
606
|
|
|
|
|
|
|
base is 1 and the number is inclusive, ie 1-2 are the first two |
607
|
|
|
|
|
|
|
bases of the sequence. |
608
|
|
|
|
|
|
|
Returns : A scalar. |
609
|
|
|
|
|
|
|
Args : A position. |
610
|
|
|
|
|
|
|
|
611
|
|
|
|
|
|
|
=cut |
612
|
|
|
|
|
|
|
|
613
|
|
|
|
|
|
|
sub baseat { |
614
|
1107
|
|
|
1107
|
1
|
771
|
my ($self,$val) = @_; |
615
|
1107
|
|
|
|
|
1491
|
return $self->{swq}->subseq($val,$val); |
616
|
|
|
|
|
|
|
} |
617
|
|
|
|
|
|
|
|
618
|
|
|
|
|
|
|
=head2 subqual($start,$end) |
619
|
|
|
|
|
|
|
|
620
|
|
|
|
|
|
|
Title : subqual($start,$end) |
621
|
|
|
|
|
|
|
Usage : @qualities = @{$obj->subqual(10,20); |
622
|
|
|
|
|
|
|
Function: returns the quality values from $start to $end, where the |
623
|
|
|
|
|
|
|
first value is 1 and the number is inclusive, ie 1-2 are the |
624
|
|
|
|
|
|
|
first two bases of the sequence. Start cannot be larger than |
625
|
|
|
|
|
|
|
end but can be equal. |
626
|
|
|
|
|
|
|
Returns : A reference to an array. |
627
|
|
|
|
|
|
|
Args : a start position and an end position |
628
|
|
|
|
|
|
|
|
629
|
|
|
|
|
|
|
=cut |
630
|
|
|
|
|
|
|
|
631
|
|
|
|
|
|
|
sub subqual { |
632
|
3
|
|
|
3
|
1
|
1808
|
my ($self,@args) = @_; |
633
|
3
|
|
|
|
|
13
|
return $self->{swq}->subqual(@args); |
634
|
|
|
|
|
|
|
} |
635
|
|
|
|
|
|
|
|
636
|
|
|
|
|
|
|
=head2 qualat($position) |
637
|
|
|
|
|
|
|
|
638
|
|
|
|
|
|
|
Title : qualat($position) |
639
|
|
|
|
|
|
|
Usage : $quality = $obj->qualat(10); |
640
|
|
|
|
|
|
|
Function: Return the quality value at the given location, where the |
641
|
|
|
|
|
|
|
first value is 1 and the number is inclusive, ie 1-2 are the |
642
|
|
|
|
|
|
|
first two bases of the sequence. Start cannot be larger than |
643
|
|
|
|
|
|
|
end but can be equal. |
644
|
|
|
|
|
|
|
Returns : A scalar. |
645
|
|
|
|
|
|
|
Args : A position. |
646
|
|
|
|
|
|
|
|
647
|
|
|
|
|
|
|
=cut |
648
|
|
|
|
|
|
|
|
649
|
|
|
|
|
|
|
sub qualat { |
650
|
1
|
|
|
1
|
1
|
2
|
my ($self,$val) = @_; |
651
|
1
|
|
|
|
|
6
|
return $self->{swq}->qualat($val); |
652
|
|
|
|
|
|
|
} |
653
|
|
|
|
|
|
|
|
654
|
|
|
|
|
|
|
=head2 sub_peak_index($start,$end) |
655
|
|
|
|
|
|
|
|
656
|
|
|
|
|
|
|
Title : sub_peak_index($start,$end) |
657
|
|
|
|
|
|
|
Usage : @peak_indices = @{$obj->sub_peak_index(10,20); |
658
|
|
|
|
|
|
|
Function: returns the trace index values from $start to $end, where the |
659
|
|
|
|
|
|
|
first value is 1 and the number is inclusive, ie 1-2 are the |
660
|
|
|
|
|
|
|
first two trace indices for this channel. |
661
|
|
|
|
|
|
|
Returns : A reference to an array. |
662
|
|
|
|
|
|
|
Args : a start position and an end position |
663
|
|
|
|
|
|
|
|
664
|
|
|
|
|
|
|
=cut |
665
|
|
|
|
|
|
|
|
666
|
|
|
|
|
|
|
sub sub_peak_index { |
667
|
6
|
|
|
6
|
1
|
429
|
my ($self,$start,$end) = @_; |
668
|
6
|
50
|
|
|
|
18
|
if( $start > $end ){ |
669
|
0
|
|
|
|
|
0
|
$self->throw("in sub_peak_index, start [$start] has to be greater than end [$end]"); |
670
|
|
|
|
|
|
|
} |
671
|
|
|
|
|
|
|
|
672
|
6
|
50
|
33
|
|
|
21
|
if( $start <= 0 || $end > $self->length ) { |
673
|
0
|
|
|
|
|
0
|
$self->throw("You have to have start positive and length less than the total length of sequence [$start:$end] Total ".$self->length.""); |
674
|
|
|
|
|
|
|
} |
675
|
|
|
|
|
|
|
|
676
|
|
|
|
|
|
|
# remove one from start, and then length is end-start |
677
|
|
|
|
|
|
|
|
678
|
6
|
|
|
|
|
7
|
$start--; |
679
|
6
|
|
|
|
|
7
|
$end--; |
680
|
6
|
|
|
|
|
10
|
my @sub_peak_index_array = @{$self->{peak_indices}}[$start..$end]; |
|
6
|
|
|
|
|
31
|
|
681
|
|
|
|
|
|
|
|
682
|
|
|
|
|
|
|
# return substr $self->seq(), $start, ($end-$start); |
683
|
6
|
|
|
|
|
29
|
return \@sub_peak_index_array; |
684
|
|
|
|
|
|
|
|
685
|
|
|
|
|
|
|
} |
686
|
|
|
|
|
|
|
|
687
|
|
|
|
|
|
|
=head2 sub_trace($start,$end) |
688
|
|
|
|
|
|
|
|
689
|
|
|
|
|
|
|
Title : sub_trace($base_channel,$start,$end) |
690
|
|
|
|
|
|
|
Usage : @trace_values = @{$obj->sub_trace('a',10,20)}; |
691
|
|
|
|
|
|
|
Function: returns the trace values from $start to $end, where the |
692
|
|
|
|
|
|
|
first value is 1 and the number is inclusive, ie 1-2 are the |
693
|
|
|
|
|
|
|
first two bases of the sequence. Start cannot be larger than |
694
|
|
|
|
|
|
|
end but can be e_peak_index. |
695
|
|
|
|
|
|
|
Returns : A reference to an array. |
696
|
|
|
|
|
|
|
Args : a start position and an end position |
697
|
|
|
|
|
|
|
|
698
|
|
|
|
|
|
|
=cut |
699
|
|
|
|
|
|
|
|
700
|
|
|
|
|
|
|
sub sub_trace { |
701
|
57504
|
|
|
57504
|
1
|
39726
|
my ($self,$base_channel,$start,$end) = @_; |
702
|
57504
|
50
|
|
|
|
67235
|
if( $start > $end ){ |
703
|
0
|
|
|
|
|
0
|
$self->throw("in sub_trace, start [$start] has to be greater than end [$end]"); |
704
|
|
|
|
|
|
|
} |
705
|
|
|
|
|
|
|
|
706
|
57504
|
50
|
33
|
|
|
89593
|
if( $start <= 0 || $end > $self->trace_length() ) { |
707
|
0
|
|
|
|
|
0
|
$self->throw("You have to have start positive and length less than the total length of traces [$start:$end] Total ".$self->trace_length.""); |
708
|
|
|
|
|
|
|
} |
709
|
|
|
|
|
|
|
|
710
|
|
|
|
|
|
|
# remove one from start, and then length is end-start |
711
|
|
|
|
|
|
|
|
712
|
57504
|
|
|
|
|
36782
|
$start--; |
713
|
57504
|
|
|
|
|
33309
|
$end--; |
714
|
57504
|
|
|
|
|
44294
|
my @sub_peak_index_array = @{$self->trace($base_channel)}[$start..$end]; |
|
57504
|
|
|
|
|
55440
|
|
715
|
|
|
|
|
|
|
|
716
|
|
|
|
|
|
|
# return substr $self->seq(), $start, ($end-$start); |
717
|
57504
|
|
|
|
|
132930
|
return \@sub_peak_index_array; |
718
|
|
|
|
|
|
|
|
719
|
|
|
|
|
|
|
} |
720
|
|
|
|
|
|
|
|
721
|
|
|
|
|
|
|
=head2 trace_length() |
722
|
|
|
|
|
|
|
|
723
|
|
|
|
|
|
|
Title : trace_length() |
724
|
|
|
|
|
|
|
Usage : $trace_length = $obj->trace_length(); |
725
|
|
|
|
|
|
|
Function: Return the length of the trace if all four traces (atgc) |
726
|
|
|
|
|
|
|
are the same. Otherwise, throw an error. |
727
|
|
|
|
|
|
|
Returns : A scalar. |
728
|
|
|
|
|
|
|
Args : none |
729
|
|
|
|
|
|
|
|
730
|
|
|
|
|
|
|
=cut |
731
|
|
|
|
|
|
|
|
732
|
|
|
|
|
|
|
sub trace_length { |
733
|
57516
|
|
|
57516
|
1
|
39819
|
my $self = shift; |
734
|
57516
|
50
|
33
|
|
|
57831
|
if ( !$self->trace('a') || !$self->trace('t') || !$self->trace('g') || !$self->trace('c') ) { |
|
|
|
33
|
|
|
|
|
|
|
|
33
|
|
|
|
|
735
|
0
|
|
|
|
|
0
|
$self->warn("One or more of the trace channels are missing. Cannot give you a length."); |
736
|
|
|
|
|
|
|
|
737
|
|
|
|
|
|
|
} |
738
|
57516
|
|
|
|
|
43417
|
my $lengtha = scalar(@{$self->trace('a')}); |
|
57516
|
|
|
|
|
55419
|
|
739
|
57516
|
|
|
|
|
34997
|
my $lengtht = scalar(@{$self->trace('t')}); |
|
57516
|
|
|
|
|
52084
|
|
740
|
57516
|
|
|
|
|
35619
|
my $lengthg = scalar(@{$self->trace('g')}); |
|
57516
|
|
|
|
|
54070
|
|
741
|
57516
|
|
|
|
|
37585
|
my $lengthc = scalar(@{$self->trace('c')}); |
|
57516
|
|
|
|
|
59377
|
|
742
|
57516
|
50
|
33
|
|
|
218948
|
if (($lengtha == $lengtht) && ($lengtha == $lengthg) && ($lengtha == $lengthc) ) { |
|
|
|
33
|
|
|
|
|
743
|
57516
|
|
|
|
|
118558
|
return $lengtha; |
744
|
|
|
|
|
|
|
} |
745
|
0
|
|
|
|
|
0
|
$self->warn("Not all of the trace indices are the same length". |
746
|
|
|
|
|
|
|
" Here are their lengths: a: $lengtha t:$lengtht ". |
747
|
|
|
|
|
|
|
" g: $lengthg c: $lengthc"); |
748
|
|
|
|
|
|
|
} |
749
|
|
|
|
|
|
|
|
750
|
|
|
|
|
|
|
|
751
|
|
|
|
|
|
|
|
752
|
|
|
|
|
|
|
=head2 sub_trace_object($start,$end) |
753
|
|
|
|
|
|
|
|
754
|
|
|
|
|
|
|
Title : sub_trace_object($start,$end) |
755
|
|
|
|
|
|
|
Usage : $smaller_object = $object->sub_trace_object('1','100'); |
756
|
|
|
|
|
|
|
Function: Get a subset of the sequence, its quality, and its trace. |
757
|
|
|
|
|
|
|
Returns : A reference to a Bio::Seq::SequenceTrace object |
758
|
|
|
|
|
|
|
Args : a start position and an end position |
759
|
|
|
|
|
|
|
Notes : |
760
|
|
|
|
|
|
|
- the start and end position refer to the positions of _bases_. |
761
|
|
|
|
|
|
|
- for example, to get a sub SequenceTrace for bases 5-10, |
762
|
|
|
|
|
|
|
use this routine. |
763
|
|
|
|
|
|
|
- you will get the bases, qualities, and the trace values |
764
|
|
|
|
|
|
|
- you can then use this object to synthesize a new scf |
765
|
|
|
|
|
|
|
using seqIO::scf. |
766
|
|
|
|
|
|
|
|
767
|
|
|
|
|
|
|
=cut |
768
|
|
|
|
|
|
|
|
769
|
|
|
|
|
|
|
sub sub_trace_object { |
770
|
2
|
|
|
2
|
1
|
410
|
my ($self,$start,$end) = @_; |
771
|
2
|
|
|
|
|
4
|
my ($start2,$end2); |
772
|
2
|
|
|
|
|
5
|
my @subs = @{$self->sub_peak_index($start,$end)}; |
|
2
|
|
|
|
|
7
|
|
773
|
2
|
|
|
|
|
7
|
$start2 = shift(@subs); |
774
|
2
|
|
|
|
|
4
|
$end2 = pop(@subs); |
775
|
2
|
|
|
|
|
12
|
my $new_object = Bio::Seq::SequenceTrace->new( |
776
|
|
|
|
|
|
|
-swq => Bio::Seq::Quality->new( |
777
|
|
|
|
|
|
|
-seq => $self->subseq($start,$end), |
778
|
|
|
|
|
|
|
-qual => $self->subqual($start,$end), |
779
|
|
|
|
|
|
|
-id => $self->id() |
780
|
|
|
|
|
|
|
), |
781
|
|
|
|
|
|
|
-trace_a => $self->sub_trace('a',$start2,$end2), |
782
|
|
|
|
|
|
|
-trace_t => $self->sub_trace('t',$start2,$end2), |
783
|
|
|
|
|
|
|
-trace_g => $self->sub_trace('g',$start2,$end2), |
784
|
|
|
|
|
|
|
-trace_c => $self->sub_trace('c',$start2,$end2), |
785
|
|
|
|
|
|
|
-peak_indices => $self->sub_peak_index($start,$end) |
786
|
|
|
|
|
|
|
|
787
|
|
|
|
|
|
|
); |
788
|
2
|
|
|
|
|
10
|
$new_object->set_accuracies(); |
789
|
2
|
|
|
|
|
7
|
$new_object->_reset_peak_indices(); |
790
|
2
|
|
|
|
|
10
|
return $new_object; |
791
|
|
|
|
|
|
|
} |
792
|
|
|
|
|
|
|
|
793
|
|
|
|
|
|
|
=head2 _synthesize_traces() |
794
|
|
|
|
|
|
|
|
795
|
|
|
|
|
|
|
Title : _synthesize_traces() |
796
|
|
|
|
|
|
|
Usage : $obj->_synthesize_traces(); |
797
|
|
|
|
|
|
|
Function: Synthesize false traces for this object. |
798
|
|
|
|
|
|
|
Returns : Nothing. |
799
|
|
|
|
|
|
|
Args : None. |
800
|
|
|
|
|
|
|
Notes : This method is intended to be invoked when this |
801
|
|
|
|
|
|
|
object is created with a SWQ object- that is to say that |
802
|
|
|
|
|
|
|
there is a sequence and a set of qualities but there was |
803
|
|
|
|
|
|
|
no actual trace data. |
804
|
|
|
|
|
|
|
|
805
|
|
|
|
|
|
|
=cut |
806
|
|
|
|
|
|
|
|
807
|
|
|
|
|
|
|
sub _synthesize_traces { |
808
|
4
|
|
|
4
|
|
367
|
my ($self) = shift; |
809
|
4
|
|
|
|
|
11
|
$self->peak_indices(qw()); |
810
|
|
|
|
|
|
|
#ml my $version = 2; |
811
|
|
|
|
|
|
|
# the user should be warned if traces already exist |
812
|
|
|
|
|
|
|
# |
813
|
|
|
|
|
|
|
# |
814
|
|
|
|
|
|
|
#ml ( my $sequence = $self->seq() ) =~ tr/a-z/A-Z/; |
815
|
|
|
|
|
|
|
#ml my @quals = @{$self->qual()}; |
816
|
|
|
|
|
|
|
#ml my $info; |
817
|
|
|
|
|
|
|
# build the ramp for the first base. |
818
|
|
|
|
|
|
|
# a ramp looks like this "1 4 13 29 51 71 80 71 51 29 13 4 1" times the quality score. |
819
|
|
|
|
|
|
|
# REMEMBER: A C G T |
820
|
|
|
|
|
|
|
# note to self-> smooth this thing out a bit later |
821
|
4
|
|
|
|
|
4
|
my $ramp_data; |
822
|
4
|
|
|
|
|
7
|
@{$ramp_data->{'ramp'}} = qw( 1 4 13 29 51 75 80 75 51 29 13 4 1 ); |
|
4
|
|
|
|
|
19
|
|
823
|
|
|
|
|
|
|
# the width of the ramp |
824
|
4
|
|
|
|
|
6
|
$ramp_data->{'ramp_width'} = scalar(@{$ramp_data->{'ramp'}}); |
|
4
|
|
|
|
|
13
|
|
825
|
|
|
|
|
|
|
# how far should the peaks overlap? |
826
|
4
|
|
|
|
|
8
|
$ramp_data->{'ramp_overlap'} = 1; |
827
|
|
|
|
|
|
|
# where should the peaks be located? |
828
|
4
|
|
|
|
|
6
|
$ramp_data->{'peak_at'} = 7; |
829
|
|
|
|
|
|
|
$ramp_data->{'ramp_total_length'} = |
830
|
|
|
|
|
|
|
$self->seq_obj()->length() * $ramp_data->{'ramp_width'} |
831
|
4
|
|
|
|
|
8
|
- $self->seq_obj()->length() * $ramp_data->{'ramp_overlap'}; |
832
|
4
|
|
|
|
|
7
|
my $pos; |
833
|
4
|
|
|
|
|
6
|
my $total_length = $ramp_data->{ramp_total_length}; |
834
|
4
|
|
|
|
|
16
|
$self->initialize_traces("0",$total_length+2); |
835
|
|
|
|
|
|
|
# now populate them |
836
|
4
|
|
|
|
|
6
|
my ($current_base,$place_base_at,$peak_quality,$ramp_counter,$current_ramp,$ramp_position); |
837
|
|
|
|
|
|
|
#ml my $sequence_length = $self->length(); |
838
|
4
|
|
|
|
|
19
|
my $half_ramp = int($ramp_data->{'ramp_width'}/2); |
839
|
4
|
|
|
|
|
17
|
for ($pos = 0; $pos<$self->length();$pos++) { |
840
|
82
|
|
|
|
|
100
|
$current_base = uc $self->seq_obj()->subseq($pos+1,$pos+1); |
841
|
|
|
|
|
|
|
# print("Synthesizing the ramp for $current_base\n"); |
842
|
82
|
|
|
|
|
73
|
my $all_bases = "ATGC"; |
843
|
82
|
|
|
|
|
103
|
$peak_quality = $self->qual_obj()->qualat($pos+1); |
844
|
|
|
|
|
|
|
# where should the peak for this base be placed? Modeled after a mktrace scf |
845
|
|
|
|
|
|
|
$place_base_at = ($pos * $ramp_data->{'ramp_width'}) - |
846
|
|
|
|
|
|
|
($pos * $ramp_data->{'ramp_overlap'}) - |
847
|
82
|
|
|
|
|
153
|
$half_ramp + $ramp_data->{'ramp_width'} - 1; |
848
|
|
|
|
|
|
|
# print("Placing this base at this position: $place_base_at\n"); |
849
|
82
|
|
|
|
|
57
|
push @{$self->peak_indices()},$place_base_at; |
|
82
|
|
|
|
|
91
|
|
850
|
82
|
|
|
|
|
64
|
$ramp_position = $place_base_at - $half_ramp; |
851
|
82
|
50
|
|
|
|
143
|
if ($current_base =~ "N" ) { |
852
|
0
|
|
|
|
|
0
|
$current_base = "A"; |
853
|
|
|
|
|
|
|
} |
854
|
82
|
|
|
|
|
126
|
for ($current_ramp = 0; $current_ramp < $ramp_data->{'ramp_width'}; $current_ramp++) { |
855
|
|
|
|
|
|
|
# print("Placing a trace value here: $current_base ".($ramp_position+$current_ramp+1)." ".$peak_quality*$ramp_data->{'ramp'}->[$current_ramp]."\n"); |
856
|
1066
|
|
|
|
|
1632
|
$self->trace_value_at($current_base,$ramp_position+$current_ramp+1,$peak_quality*$ramp_data->{'ramp'}->[$current_ramp]); |
857
|
|
|
|
|
|
|
} |
858
|
82
|
|
|
|
|
127
|
$self->peak_index_at($pos+1, |
859
|
|
|
|
|
|
|
$place_base_at+1 |
860
|
|
|
|
|
|
|
); |
861
|
|
|
|
|
|
|
#ml my $other_bases = $self->_get_other_bases($current_base); |
862
|
|
|
|
|
|
|
# foreach ( split('',$other_bases) ) { |
863
|
|
|
|
|
|
|
# push @{$self->{'text'}->{"v3_base_accuracy"}->{$_}},0; |
864
|
|
|
|
|
|
|
#} |
865
|
|
|
|
|
|
|
} |
866
|
|
|
|
|
|
|
} |
867
|
|
|
|
|
|
|
|
868
|
|
|
|
|
|
|
|
869
|
|
|
|
|
|
|
|
870
|
|
|
|
|
|
|
|
871
|
|
|
|
|
|
|
|
872
|
|
|
|
|
|
|
=head2 _dump_traces($transformed) |
873
|
|
|
|
|
|
|
|
874
|
|
|
|
|
|
|
Title : _dump_traces("transformed") |
875
|
|
|
|
|
|
|
Usage : &_dump_traces($ra,$rc,$rg,$rt); |
876
|
|
|
|
|
|
|
Function: Used in debugging. Prints all traces one beside each other. |
877
|
|
|
|
|
|
|
Returns : Nothing. |
878
|
|
|
|
|
|
|
Args : References to the arrays containing the traces for A,C,G,T. |
879
|
|
|
|
|
|
|
Notes : Beats using dumpValue, I'll tell ya. Much better then using |
880
|
|
|
|
|
|
|
join' ' too. |
881
|
|
|
|
|
|
|
- if a scalar is included as an argument (any scalar), this |
882
|
|
|
|
|
|
|
procedure will dump the _delta'd trace. If you don't know what |
883
|
|
|
|
|
|
|
that means you should not be using this. |
884
|
|
|
|
|
|
|
|
885
|
|
|
|
|
|
|
=cut |
886
|
|
|
|
|
|
|
|
887
|
|
|
|
|
|
|
#' |
888
|
|
|
|
|
|
|
sub _dump_traces { |
889
|
0
|
|
|
0
|
|
0
|
my ($self) = @_; |
890
|
0
|
|
|
|
|
0
|
my (@sA,@sT,@sG,@sC); |
891
|
0
|
|
|
|
|
0
|
print ("Count\ta\tc\tg\tt\n"); |
892
|
0
|
|
|
|
|
0
|
my $length = $self->trace_length(); |
893
|
0
|
|
|
|
|
0
|
for (my $curr=1; $curr <= $length; $curr++) { |
894
|
0
|
|
|
|
|
0
|
print(($curr-1)."\t".$self->trace_value_at('a',$curr). |
895
|
|
|
|
|
|
|
"\t".$self->trace_value_at('c',$curr). |
896
|
|
|
|
|
|
|
"\t".$self->trace_value_at('g',$curr). |
897
|
|
|
|
|
|
|
"\t".$self->trace_value_at('t',$curr)."\n"); |
898
|
|
|
|
|
|
|
} |
899
|
0
|
|
|
|
|
0
|
return; |
900
|
|
|
|
|
|
|
} |
901
|
|
|
|
|
|
|
|
902
|
|
|
|
|
|
|
=head2 _initialize_traces() |
903
|
|
|
|
|
|
|
|
904
|
|
|
|
|
|
|
Title : _initialize_traces() |
905
|
|
|
|
|
|
|
Usage : $trace_object->_initialize_traces(); |
906
|
|
|
|
|
|
|
Function: Creates empty arrays to hold synthetic trace values. |
907
|
|
|
|
|
|
|
Returns : Nothing. |
908
|
|
|
|
|
|
|
Args : None. |
909
|
|
|
|
|
|
|
|
910
|
|
|
|
|
|
|
=cut |
911
|
|
|
|
|
|
|
|
912
|
|
|
|
|
|
|
sub initialize_traces { |
913
|
4
|
|
|
4
|
0
|
7
|
my ($self,$value,$length) = @_; |
914
|
4
|
|
|
|
|
7
|
foreach (qw(a t g c)) { |
915
|
16
|
|
|
|
|
12
|
my @temp; |
916
|
16
|
|
|
|
|
32
|
for (my $count=0; $count<$length; $count++) { |
917
|
3968
|
|
|
|
|
5408
|
$temp[$count] = $value; |
918
|
|
|
|
|
|
|
} |
919
|
16
|
|
|
|
|
34
|
$self->trace($_,\@temp); |
920
|
|
|
|
|
|
|
} |
921
|
|
|
|
|
|
|
} |
922
|
|
|
|
|
|
|
|
923
|
|
|
|
|
|
|
=head2 trace_value_at($channel,$position) |
924
|
|
|
|
|
|
|
|
925
|
|
|
|
|
|
|
Title : trace_value_at($channel,$position) |
926
|
|
|
|
|
|
|
Usage : $value = $trace_object->trace_value_at($channel,$position); |
927
|
|
|
|
|
|
|
Function: What is the value of the trace for this base at this position? |
928
|
|
|
|
|
|
|
Returns : A scalar represnting the trace value here. |
929
|
|
|
|
|
|
|
Args : a base channel (a,t,g,c) |
930
|
|
|
|
|
|
|
a position ( < $trace_object->trace_length() ) |
931
|
|
|
|
|
|
|
|
932
|
|
|
|
|
|
|
=cut |
933
|
|
|
|
|
|
|
|
934
|
|
|
|
|
|
|
sub trace_value_at { |
935
|
57495
|
|
|
57495
|
1
|
47975
|
my ($self,$channel,$position,$value) = @_; |
936
|
57495
|
100
|
|
|
|
64250
|
if ($value) { |
937
|
1066
|
|
|
|
|
927
|
$self->trace($channel)->[$position] = $value; |
938
|
|
|
|
|
|
|
} |
939
|
57495
|
|
|
|
|
61199
|
return $self->sub_trace($channel,($position),($position))->[0]; |
940
|
|
|
|
|
|
|
} |
941
|
|
|
|
|
|
|
|
942
|
|
|
|
|
|
|
sub _deprecated_get_scf_version_2_base_structure { |
943
|
|
|
|
|
|
|
# this sub is deprecated- check inside SeqIO::scf |
944
|
0
|
|
|
0
|
|
0
|
my $self = shift; |
945
|
0
|
|
|
|
|
0
|
my (@structure,$current); |
946
|
0
|
|
|
|
|
0
|
my $length = $self->length(); |
947
|
0
|
|
|
|
|
0
|
for ($current=1; $current <= $self->length() ; $current++) { |
948
|
0
|
|
|
|
|
0
|
my $base_here = $self->seq_obj()->subseq($current,$current); |
949
|
0
|
|
|
|
|
0
|
$base_here = lc($base_here); |
950
|
0
|
|
|
|
|
0
|
my $probabilities; |
951
|
0
|
|
|
|
|
0
|
$probabilities->{$base_here} = $self->qual_obj()->qualat($current); |
952
|
0
|
|
|
|
|
0
|
my $other_bases = "atgc"; |
953
|
0
|
|
|
|
|
0
|
my $empty = ""; |
954
|
0
|
|
|
|
|
0
|
$other_bases =~ s/$base_here/$empty/e; |
|
0
|
|
|
|
|
0
|
|
955
|
0
|
|
|
|
|
0
|
foreach ( split('',$other_bases) ) { |
956
|
0
|
|
|
|
|
0
|
$probabilities->{$_} = "0"; |
957
|
|
|
|
|
|
|
} |
958
|
|
|
|
|
|
|
@structure = ( |
959
|
|
|
|
|
|
|
@structure, |
960
|
|
|
|
|
|
|
$self->peak_index_at($current), |
961
|
|
|
|
|
|
|
$probabilities->{'a'}, |
962
|
|
|
|
|
|
|
$probabilities->{'t'}, |
963
|
|
|
|
|
|
|
$probabilities->{'g'}, |
964
|
0
|
|
|
|
|
0
|
$probabilities->{'c'} |
965
|
|
|
|
|
|
|
); |
966
|
|
|
|
|
|
|
|
967
|
|
|
|
|
|
|
} |
968
|
0
|
|
|
|
|
0
|
return \@structure; |
969
|
|
|
|
|
|
|
} |
970
|
|
|
|
|
|
|
|
971
|
|
|
|
|
|
|
sub _deprecated_get_scf_version_3_base_structure { |
972
|
0
|
|
|
0
|
|
0
|
my $self = shift; |
973
|
0
|
|
|
|
|
0
|
my $structure; |
974
|
0
|
|
|
|
|
0
|
$structure = join('',$self->peak_indices()); |
975
|
0
|
|
|
|
|
0
|
return $structure; |
976
|
|
|
|
|
|
|
} |
977
|
|
|
|
|
|
|
|
978
|
|
|
|
|
|
|
|
979
|
|
|
|
|
|
|
=head2 accuracies($channel,$position) |
980
|
|
|
|
|
|
|
|
981
|
|
|
|
|
|
|
Title : trace_value_at($channel,$position) |
982
|
|
|
|
|
|
|
Usage : $value = $trace_object->trace_value_at($channel,$position); |
983
|
|
|
|
|
|
|
Function: What is the value of the trace for this base at this position? |
984
|
|
|
|
|
|
|
Returns : A scalar representing the trace value here. |
985
|
|
|
|
|
|
|
Args : a base channel (a,t,g,c) |
986
|
|
|
|
|
|
|
a position ( < $trace_object->trace_length() ) |
987
|
|
|
|
|
|
|
|
988
|
|
|
|
|
|
|
=cut |
989
|
|
|
|
|
|
|
|
990
|
|
|
|
|
|
|
|
991
|
|
|
|
|
|
|
sub accuracies { |
992
|
133
|
|
|
133
|
1
|
133
|
my ($self,$channel,$value) = @_; |
993
|
133
|
100
|
|
|
|
178
|
if ($value) { |
994
|
61
|
100
|
|
|
|
97
|
if (ref($value) eq "ARRAY") { |
995
|
60
|
|
|
|
|
90
|
$self->{accuracies}->{$channel} = $value; |
996
|
|
|
|
|
|
|
} |
997
|
|
|
|
|
|
|
else { |
998
|
1
|
|
|
|
|
4
|
my @acc = split(' ',$value); |
999
|
1
|
|
|
|
|
15
|
$self->{accuracies}->{$channel} = \@acc; |
1000
|
|
|
|
|
|
|
} |
1001
|
|
|
|
|
|
|
} |
1002
|
133
|
|
|
|
|
1546
|
return $self->{accuracies}->{$channel}; |
1003
|
|
|
|
|
|
|
} |
1004
|
|
|
|
|
|
|
|
1005
|
|
|
|
|
|
|
|
1006
|
|
|
|
|
|
|
=head2 set_accuracies() |
1007
|
|
|
|
|
|
|
|
1008
|
|
|
|
|
|
|
Title : set_sccuracies() |
1009
|
|
|
|
|
|
|
Usage : $trace_object->set_accuracies(); |
1010
|
|
|
|
|
|
|
Function: Take a sequence's quality and synthesize proper scf-style |
1011
|
|
|
|
|
|
|
base accuracies that can then be accessed with |
1012
|
|
|
|
|
|
|
accuracies("a") or something like it. |
1013
|
|
|
|
|
|
|
Returns : Nothing. |
1014
|
|
|
|
|
|
|
Args : None. |
1015
|
|
|
|
|
|
|
|
1016
|
|
|
|
|
|
|
=cut |
1017
|
|
|
|
|
|
|
|
1018
|
|
|
|
|
|
|
sub set_accuracies { |
1019
|
8
|
|
|
8
|
1
|
12
|
my $self = shift; |
1020
|
8
|
|
|
|
|
11
|
my $count = 0; |
1021
|
8
|
|
|
|
|
22
|
my $length = $self->length(); |
1022
|
8
|
|
|
|
|
25
|
for ($count=1; $count <= $length; $count++) { |
1023
|
184
|
|
|
|
|
221
|
my $base_here = $self->seq_obj()->subseq($count,$count); |
1024
|
184
|
|
|
|
|
233
|
my $qual_here = $self->qual_obj()->qualat($count); |
1025
|
184
|
|
|
|
|
298
|
$self->accuracy_at($base_here,$count,$qual_here); |
1026
|
184
|
|
|
|
|
197
|
my $other_bases = $self->_get_other_bases($base_here); |
1027
|
184
|
|
|
|
|
425
|
foreach (split('',$other_bases)) { |
1028
|
552
|
|
|
|
|
588
|
$self->accuracy_at($_,$count,"null"); |
1029
|
|
|
|
|
|
|
} |
1030
|
|
|
|
|
|
|
} |
1031
|
|
|
|
|
|
|
} |
1032
|
|
|
|
|
|
|
|
1033
|
|
|
|
|
|
|
|
1034
|
|
|
|
|
|
|
=head2 scf_dump() |
1035
|
|
|
|
|
|
|
|
1036
|
|
|
|
|
|
|
Title : scf_dump() |
1037
|
|
|
|
|
|
|
Usage : $trace_object->scf_dump(); |
1038
|
|
|
|
|
|
|
Function: Prints out the contents of the structures representing |
1039
|
|
|
|
|
|
|
the SequenceTrace in a manner similar to io_lib's scf_dump. |
1040
|
|
|
|
|
|
|
Returns : Nothing. Prints out the contents of the structures |
1041
|
|
|
|
|
|
|
used to represent the sequence and its trace. |
1042
|
|
|
|
|
|
|
Args : None. |
1043
|
|
|
|
|
|
|
Notes : Used in debugging, obviously. |
1044
|
|
|
|
|
|
|
|
1045
|
|
|
|
|
|
|
=cut |
1046
|
|
|
|
|
|
|
|
1047
|
|
|
|
|
|
|
sub scf_dump { |
1048
|
0
|
|
|
0
|
1
|
0
|
my $self = shift; |
1049
|
0
|
|
|
|
|
0
|
my $count; |
1050
|
0
|
|
|
|
|
0
|
for ($count=1;$count<=$self->length();$count++) { |
1051
|
0
|
|
|
|
|
0
|
my $base_here = lc($self->seq_obj()->subseq($count,$count)); |
1052
|
0
|
|
|
|
|
0
|
print($base_here." ".sprintf("%05d",$self->peak_index_at($count))."\t"); |
1053
|
0
|
|
|
|
|
0
|
foreach (sort qw(a c g t)) { |
1054
|
0
|
|
|
|
|
0
|
print(sprintf("%03d",$self->accuracy_at($_,$count))."\t"); |
1055
|
|
|
|
|
|
|
} |
1056
|
0
|
|
|
|
|
0
|
print("\n"); |
1057
|
|
|
|
|
|
|
} |
1058
|
0
|
|
|
|
|
0
|
$self->_dump_traces(); |
1059
|
|
|
|
|
|
|
} |
1060
|
|
|
|
|
|
|
|
1061
|
|
|
|
|
|
|
=head2 _get_other_bases($this_base) |
1062
|
|
|
|
|
|
|
|
1063
|
|
|
|
|
|
|
Title : _get_other_bases($this_base) |
1064
|
|
|
|
|
|
|
Usage : $other_bases = $trace_object->_get_other_bases($this_base); |
1065
|
|
|
|
|
|
|
Function: A utility routine to return bases other then the one provided. |
1066
|
|
|
|
|
|
|
I was doing this over and over so I put it here. |
1067
|
|
|
|
|
|
|
Returns : Three of a,t,g and c. |
1068
|
|
|
|
|
|
|
Args : A base (atgc) |
1069
|
|
|
|
|
|
|
Notes : $obj->_get_other_bases("a") returns "tgc" |
1070
|
|
|
|
|
|
|
|
1071
|
|
|
|
|
|
|
=cut |
1072
|
|
|
|
|
|
|
|
1073
|
|
|
|
|
|
|
sub _get_other_bases { |
1074
|
184
|
|
|
184
|
|
145
|
my ($self,$this_base) = @_; |
1075
|
184
|
|
|
|
|
164
|
$this_base = lc($this_base); |
1076
|
184
|
|
|
|
|
134
|
my $all_bases = "atgc"; |
1077
|
184
|
|
|
|
|
123
|
my $empty = ""; |
1078
|
184
|
|
|
|
|
1192
|
$all_bases =~ s/$this_base/$empty/e; |
|
184
|
|
|
|
|
273
|
|
1079
|
184
|
|
|
|
|
280
|
return $all_bases; |
1080
|
|
|
|
|
|
|
} |
1081
|
|
|
|
|
|
|
|
1082
|
|
|
|
|
|
|
|
1083
|
|
|
|
|
|
|
=head2 accuracy_at($base,$position) |
1084
|
|
|
|
|
|
|
|
1085
|
|
|
|
|
|
|
Title : accuracy_at($base,$position) |
1086
|
|
|
|
|
|
|
Usage : $accuracy = $trace_object->accuracy_at($base,$position); |
1087
|
|
|
|
|
|
|
Function: |
1088
|
|
|
|
|
|
|
Returns : Returns the accuracy of finding $base at $position. |
1089
|
|
|
|
|
|
|
Args : 1. a base channel (atgc) 2. a value to _set_ the accuracy |
1090
|
|
|
|
|
|
|
Notes : $obj->_get_other_bases("a") returns "tgc" |
1091
|
|
|
|
|
|
|
|
1092
|
|
|
|
|
|
|
=cut |
1093
|
|
|
|
|
|
|
|
1094
|
|
|
|
|
|
|
|
1095
|
|
|
|
|
|
|
sub accuracy_at { |
1096
|
5161
|
|
|
5161
|
1
|
3778
|
my ($self,$base,$position,$value) = @_; |
1097
|
5161
|
|
|
|
|
3338
|
$base = lc($base); |
1098
|
5161
|
100
|
|
|
|
5214
|
if ($value) { |
1099
|
736
|
100
|
|
|
|
719
|
if ($value eq "null") { |
1100
|
552
|
|
|
|
|
646
|
$self->{accuracies}->{$base}->[$position-1] = "0"; |
1101
|
|
|
|
|
|
|
} |
1102
|
|
|
|
|
|
|
else { |
1103
|
184
|
|
|
|
|
270
|
$self->{accuracies}->{$base}->[$position-1] = $value; |
1104
|
|
|
|
|
|
|
} |
1105
|
|
|
|
|
|
|
} |
1106
|
5161
|
|
|
|
|
5780
|
return $self->{accuracies}->{$base}->[$position-1]; |
1107
|
|
|
|
|
|
|
} |
1108
|
|
|
|
|
|
|
|
1109
|
|
|
|
|
|
|
1; |
1110
|
|
|
|
|
|
|
|