File Coverage

Bio/SeqIO/scf.pm

Criterion	Covered	Total	%
statement	371	518	71.6
branch	77	142	54.2
condition	4	14	28.5
subroutine	26	37	70.2
pod	5	6	83.3
total	483	717	67.3

line	stmt	bran	cond	sub	pod	time	code
1							#
2							# Copyright (c) 1997-2001 bioperl, Chad Matsalla. All Rights Reserved.
3							# This module is free software; you can redistribute it and/or
4							# modify it under the same terms as Perl itself.
5							#
6							# Copyright Chad Matsalla
7							#
8							# You may distribute this module under the same terms as perl itself
9
10							# POD documentation - main docs before the code
11
12							=head1 NAME
13
14							Bio::SeqIO::scf - .scf file input/output stream
15
16							=head1 SYNOPSIS
17
18							Do not use this module directly. Use it via the Bio::SeqIO class, see
19							L for more information.
20
21							=head1 DESCRIPTION
22
23							This object can transform .scf files to and from Bio::Seq::SequenceTrace
24							objects. Mechanisms are present to retrieve trace data from scf
25							files.
26
27							=head1 FEEDBACK
28
29							=head2 Mailing Lists
30
31							User feedback is an integral part of the evolution of this and other
32							Bioperl modules. Send your comments and suggestions preferably to one
33							of the Bioperl mailing lists. Your participation is much appreciated.
34
35							bioperl-l@bioperl.org - General discussion
36							http://bioperl.org/wiki/Mailing_lists - About the mailing lists
37
38							=head2 Support
39
40							Please direct usage questions or support issues to the mailing list:
41
42							I
43
44							rather than to the module maintainer directly. Many experienced and
45							reponsive experts will be able look at the problem and quickly
46							address it. Please include a thorough description of the problem
47							with code and data examples if at all possible.
48
49							=head2 Reporting Bugs
50
51							Report bugs to the Bioperl bug tracking system to help us keep track
52							the bugs and their resolution. Bug reports can be submitted via
53							the web:
54
55							https://github.com/bioperl/bioperl-live/issues
56
57							=head1 AUTHOR Chad Matsalla
58
59							Chad Matsalla
60							bioinformatics@dieselwurks.com
61
62							=head1 CONTRIBUTORS
63
64							Jason Stajich, jason@bioperl.org
65							Tony Cox, avc@sanger.ac.uk
66							Heikki Lehvaslaiho, heikki-at-bioperl-dot-org
67							Nancy Hansen, nhansen at mail.nih.gov
68
69							=head1 APPENDIX
70
71							The rest of the documentation details each of the object
72							methods. Internal methods are usually preceded with a _
73
74							=cut
75
76							# Let the code begin...
77
78							package Bio::SeqIO::scf;
79	1			1		548	use vars qw($DEFAULT_QUALITY);
	1					1
	1					34
80	1			1		3	use strict;
	1					1
	1					15
81	1			1		241	use Bio::Seq::SeqFactory;
	1					1
	1					21
82	1			1		391	use Bio::Seq::SequenceTrace;
	1					2
	1					37
83	1			1		237	use Bio::Annotation::Comment;
	1					1
	1					21
84	1			1		4	use Dumpvalue;
	1					1
	1					29
85
86							my $dumper = Dumpvalue->new();
87							$dumper->veryCompact(1);
88
89							BEGIN {
90	1			1		14	$DEFAULT_QUALITY= 10;
91							}
92
93	1			1		3	use base qw(Bio::SeqIO);
	1					1
	1					326
94
95							sub _initialize {
96	25			25		53	my($self,@args) = @_;
97	25					75	$self->SUPER::_initialize(@args);
98	25	50				181	if( ! defined $self->sequence_factory ) {
99	25					81	$self->sequence_factory(Bio::Seq::SeqFactory->new
100							(-verbose => $self->verbose(),
101							-type => 'Bio::Seq::Quality'));
102							}
103	25					53	binmode $self->_fh; # for the Win32/Mac crowds
104							}
105
106							=head2 next_seq()
107
108							Title : next_seq()
109							Usage : $scf = $stream->next_seq()
110							Function: returns the next scf sequence in the stream
111							Returns : a Bio::Seq::SequenceTrace object
112							Args : NONE
113							Notes : Fills the interface specification for SeqIO.
114							The SCF specification does not provide for having more then
115							one sequence in a given scf. So once the filehandle has been open
116							and passed to SeqIO do not expect to run this function more then
117							once on a given scf unless you embraced and extended the SCF
118							standard. SCF comments are accessible through the Bio::SeqI
119							interface method annotation().
120
121							=cut
122
123							#'
124							sub next_seq {
125	15			15	1	52	my ($self) = @_;
126	15					29	my ($seq, $seqc, $fh, $buffer, $offset, $length, $read_bytes, @read,
127							%names);
128							# set up a filehandle to read in the scf
129	15	50				43	return if $self->{_readfile};
130	15					39	$fh = $self->_fh();
131	15	50				50	unless ($fh) { # simulate the <> function
132	0	0	0			0	if ( !fileno(ARGV) or eof(ARGV) ) {
133	0	0				0	return unless my $ARGV = shift;
134	0	0				0	open(ARGV,$ARGV) or
135							$self->throw("Could not open $ARGV for SCF stream reading $!");
136							}
137	0					0	$fh = \*ARGV;
138							}
139	15	50				217	return unless read $fh, $buffer, 128; # no exception; probably end of file
140							# now, the master data structure will be the creator
141	15					24	my $creator;
142							# he first thing to do is parse the header. This is common
143							# among all versions of scf.
144							# the rest of the the information is different between the
145							# the different versions of scf.
146
147	15					49	$creator->{header} = $self->_get_header($buffer);
148	15	100				51	if ($creator->{header}->{'version'} lt "3.00") {
149	4					18	$self->debug("scf.pm is working with a version 2 scf.\n");
150							# first gather the trace information
151							$length = $creator->{header}->{'samples'} *
152	4					12	$creator->{header}->{sample_size}*4;
153							$buffer = $self->read_from_buffer($fh, $buffer, $length,
154	4					20	$creator->{header}->{samples_offset});
155							# @read = unpack "n$length",$buffer;
156							# these traces need to be split
157							# returns a reference to a hash
158							$creator->{traces} = $self->_parse_v2_traces(
159	4					22	$buffer,$creator->{header}->{sample_size});
160							# now go and get the base information
161	4					14	$offset = $creator->{header}->{bases_offset};
162	4					16	$length = ($creator->{header}->{bases} * 12);
163	4					44	seek $fh,$offset,0;
164	4					33	$buffer = $self->read_from_buffer($fh,$buffer,$length,$creator->{header}->{bases_offset});
165							# now distill the information into its fractions.
166							# the old way : $self->_set_v2_bases($buffer);
167							# ref to an array, ref to a hash, string
168							($creator->{peak_indices},
169							$creator->{qualities},
170							$creator->{sequence},
171	4					24	$creator->{accuracies}) = $self->_parse_v2_bases($buffer);
172
173							} else {
174	11					35	$self->debug("scf.pm is working with a version 3+ scf.\n");
175	11					13	my $transformed_read;
176	11					20	my $current_read_position = $creator->{header}->{sample_offset};
177							$length = $creator->{header}->{'samples'}*
178	11					22	$creator->{header}->{sample_size};
179							# $dumper->dumpValue($creator->{header});
180	11					34	foreach (qw(a c g t)) {
181	44					163	$buffer = $self->read_from_buffer($fh,$buffer,$length,$current_read_position);
182	44					84	my $byte = "n";
183	44	50				124	if ($creator->{header}->{sample_size} == 1) {
184	0					0	$byte = "c";
185							}
186	44					29461	@read = unpack "${byte}${length}",$buffer;
187							# this little spurt of nonsense is because
188							# the trace values are given in the binary
189							# file as unsigned shorts but they really
190							# are signed deltas. 30000 is an arbitrary number
191							# (will there be any traces with a given
192							# point greater then 30000? I hope not.
193							# once the read is read, it must be changed
194							# from relative
195	44					6420	foreach (@read) {
196	424924	100				431702	if ($_ > 30000) {
197	142333					90688	$_ -= 65536;
198							}
199							}
200	44					230	$transformed_read = $self->_delta(\@read,"backward");
201							# For 8-bit data we need to emulate a signed/unsigned
202							# cast that is implicit in the C implementations.....
203	44	50				16353	if ($creator->{header}->{sample_size} == 1) {
204	0					0	foreach (@{$transformed_read}) {
	0					0
205	0	0				0	$_ += 256 if ($_ < 0);
206							}
207							}
208	44					60	$current_read_position += $length;
209	44					47	$creator->{'traces'}->{$_} = join(' ',@{$transformed_read});
	44					51544
210							}
211
212							# now go and get the peak index information
213	11					29	$offset = $creator->{header}->{bases_offset};
214	11					26	$length = ($creator->{header}->{bases} * 4);
215	11					56	$buffer = $self->read_from_buffer($fh,$buffer,$length,$offset);
216	11					41	$creator->{peak_indices} = $self->_get_v3_peak_indices($buffer);
217	11					22	$offset += $length;
218							# now go and get the accuracy information
219	11					51	$buffer = $self->read_from_buffer($fh,$buffer,$length,$offset);
220	11					40	$creator->{accuracies} = $self->_get_v3_base_accuracies($buffer);
221							# OK, now go and get the base information.
222	11					18	$offset += $length;
223	11					22	$length = $creator->{header}->{bases};
224	11					22	$buffer = $self->read_from_buffer($fh,$buffer,$length,$offset);
225	11					57	$creator->{'sequence'} = unpack("a$length",$buffer);
226							# now, finally, extract the calls from the accuracy information.
227							$creator->{qualities} = $self->_get_v3_quality(
228	11					46	$creator->{'sequence'},$creator->{accuracies});
229							}
230							# now go and get the comment information
231	15					53	$offset = $creator->{header}->{comments_offset};
232	15					68	seek $fh,$offset,0;
233	15					21	$length = $creator->{header}->{comment_size};
234	15					61	$buffer = $self->read_from_buffer($fh,$buffer,$length);
235	15					56	$creator->{comments} = $self->_get_comments($buffer);
236	74					84	my @name_comments = grep {$_->tagname() eq 'NAME'}
237	15					81	$creator->{comments}->get_Annotations('comment');
238	15					19	my $name_comment;
239	15	100				27	if (@name_comments){
240	7					25	$name_comment = $name_comments[0]->as_text();
241	7					29	$name_comment =~ s/^Comment:\s+//;
242							}
243
244							my $swq = Bio::Seq::Quality->new(
245							-seq => $creator->{'sequence'},
246	15					146	-qual => $creator->{'qualities'},
247							-id => $name_comment
248							);
249							my $returner = Bio::Seq::SequenceTrace->new(
250							-swq => $swq,
251							-trace_a => $creator->{'traces'}->{'a'},
252							-trace_t => $creator->{'traces'}->{'t'},
253							-trace_g => $creator->{'traces'}->{'g'},
254							-trace_c => $creator->{'traces'}->{'c'},
255							-accuracy_a => $creator->{'accuracies'}->{'a'},
256							-accuracy_t => $creator->{'accuracies'}->{'t'},
257							-accuracy_g => $creator->{'accuracies'}->{'g'},
258							-accuracy_c => $creator->{'accuracies'}->{'c'},
259	15					250	-peak_indices => $creator->{'peak_indices'}
260							);
261
262	15					91	$returner->annotation($creator->{'comments'}); # add SCF comments
263	15					30	$self->{'_readfile'} = 1;
264	15					2350	return $returner;
265							}
266
267
268							=head2 _get_v3_quality()
269
270							Title : _get_v3_quality()
271							Usage : $self->_get_v3_quality()
272							Function: Set the base qualities from version3 scf
273							Returns : Nothing. Alters $self.
274							Args : None.
275							Notes :
276
277							=cut
278
279							#'
280							sub _get_v3_quality {
281	11			11		24	my ($self,$sequence,$accuracies) = @_;
282	11					626	my @bases = split//,$sequence;
283	11					14	my (@qualities,$currbase,$currqual,$counter);
284	11					38	for ($counter=0; $counter <= $#bases ; $counter++) {
285	7639					5025	$currbase = lc($bases[$counter]);
286	7639	100				9456	if ($currbase eq "a") { $currqual = $accuracies->{'a'}->[$counter]; }
	1733	100				1257
		100
		50
287	2691					1834	elsif ($currbase eq "c") { $currqual = $accuracies->{'c'}->[$counter]; }
288	1227					918	elsif ($currbase eq "g") { $currqual = $accuracies->{'g'}->[$counter]; }
289	1988					1456	elsif ($currbase eq "t") { $currqual = $accuracies->{'t'}->[$counter]; }
290	0					0	else { $currqual = "unknown"; }
291	7639					9120	push @qualities,$currqual;
292							}
293	11					5030	return \@qualities;
294							}
295
296							=head2 _get_v3_peak_indices($buffer)
297
298							Title : _get_v3_peak_indices($buffer)
299							Usage : $self->_get_v3_peak_indices($buffer);
300							Function: Unpacks the base accuracies for version3 scf
301							Returns : Nothing. Alters $self
302							Args : A scalar containing binary data.
303							Notes :
304
305							=cut
306
307							sub _get_v3_peak_indices {
308	11			11		16	my ($self,$buffer) = @_;
309	11					17	my $length = length($buffer);
310	11					534	my @read = unpack "N$length",$buffer;
311	11					1397	return join(' ',@read);
312							}
313
314							=head2 _get_v3_base_accuracies($buffer)
315
316							Title : _get_v3_base_accuracies($buffer)
317							Usage : $self->_get_v3_base_accuracies($buffer)
318							Function: Set the base accuracies for version 3 scf's
319							Returns : Nothing. Alters $self.
320							Args : A scalar containing binary data.
321							Notes :
322
323							=cut
324
325							#'
326							sub _get_v3_base_accuracies {
327	11			11		16	my ($self,$buffer) = @_;
328	11					13	my $length = length($buffer);
329	11					22	my $qlength = $length/4;
330	11					12	my $offset = 0;
331	11					11	my (@qualities,@sorter,$counter,$round,$last_base,$accuracies,$currbase);
332	11					21	foreach $currbase (qw(a c g t)) {
333	44					41	my @read;
334	44					39	$last_base = $offset + $qlength;
335	44					68	for (;$offset < $last_base; $offset += $qlength) {
336							# a bioperler (perhaps me?) changed the unpack string to include 'n' rather than 'C'
337							# on 040322 I think that 'C' is correct. please email chad if you would like to accuse me of being incorrect
338	44					1593	@read = unpack "C$qlength", substr($buffer,$offset,$qlength);
339	44					600	$accuracies->{$currbase} = \@read;
340							}
341							}
342	11					28	return $accuracies;
343							}
344
345
346							=head2 _get_comments($buffer)
347
348							Title : _get_comments($buffer)
349							Usage : $self->_get_comments($buffer);
350							Function: Gather the comments section from the scf and parse it into its
351							components.
352							Returns : a Bio::Annotation::Collection object
353							Args : The buffer. It is expected that the buffer contains a binary
354							string for the comments section of an scf file according to
355							the scf file specifications.
356							Notes :
357
358							=cut
359
360							sub _get_comments {
361	15			15		26	my ($self,$buffer) = @_;
362	15					211	my $comments = Bio::Annotation::Collection->new();
363	15					32	my $size = length($buffer);
364	15					68	my $comments_retrieved = unpack "a$size",$buffer;
365	15					90	$comments_retrieved =~ s/\0//;
366	15					69	my @comments_split = split/\n/,$comments_retrieved;
367	15	100				48	if (@comments_split) {
368	13					38	foreach (@comments_split) {
369	100					323	/(\w+)=(.*)/;
370	100	100	33			348	if ($1 && $2) {
371	74					116	my ($tagname, $text) = ($1, $2);
372	74					331	my $comment_obj = Bio::Annotation::Comment->new(
373							-text => $text,
374							-tagname => $tagname);
375
376	74					163	$comments->add_Annotation('comment', $comment_obj);
377							}
378							}
379							}
380	15					36	$self->{'comments'} = $comments;
381	15					38	return $comments;
382							}
383
384							=head2 _get_header()
385
386							Title : _get_header($buffer)
387							Usage : $self->_get_header($buffer);
388							Function: Gather the header section from the scf and parse it into its
389							components.
390							Returns : Reference to a hash containing the header components.
391							Args : The buffer. It is expected that the buffer contains a binary
392							string for the header section of an scf file according to the
393							scf file specifications.
394							Notes : None.
395
396							=cut
397
398							sub _get_header {
399	15			15		25	my ($self,$buffer) = @_;
400	15					18	my $header;
401							($header->{'scf'},
402							$header->{'samples'},
403							$header->{'sample_offset'},
404							$header->{'bases'},
405							$header->{'bases_left_clip'},
406							$header->{'bases_right_clip'},
407							$header->{'bases_offset'},
408							$header->{'comment_size'},
409							$header->{'comments_offset'},
410							$header->{'version'},
411							$header->{'sample_size'},
412							$header->{'code_set'},
413	15					180	@{$header->{'header_spare'}} ) = unpack "a4 NNNNNNNN a4 NN N20", $buffer;
	15					78
414
415	15					48	$self->{'header'} = $header;
416	15					28	return $header;
417							}
418
419							=head2 _parse_v2_bases($buffer)
420
421							Title : _parse_v2_bases($buffer)
422							Usage : $self->_parse_v2_bases($buffer);
423							Function: Gather the bases section from the scf and parse it into its
424							components.
425							Returns :
426							Args : The buffer. It is expected that the buffer contains a binary
427							string for the bases section of an scf file according to the
428							scf file specifications.
429							Notes : None.
430
431							=cut
432
433							sub _parse_v2_bases {
434	4			4		10	my ($self,$buffer) = @_;
435	4					11	my $length = length($buffer);
436	4					6	my ($offset2,$currbuff,$currbase,$currqual,$sequence,@qualities,@indices);
437	0					0	my (@read,$harvester,$accuracies);
438	4					17	for ($offset2=0;$offset2<$length;$offset2+=12) {
439	3734					9866	@read = unpack "N C C C C a C3", substr($buffer,$offset2,$length);
440	3734					3081	push @indices,$read[0];
441	3734					2402	$currbase = lc($read[5]);
442	3734	100				5035	if ($currbase eq "a") { $currqual = $read[1]; }
	828	100				542
		100
		50
443	1238					781	elsif ($currbase eq "c") { $currqual = $read[2]; }
444	710					509	elsif ($currbase eq "g") { $currqual = $read[3]; }
445	958					619	elsif ($currbase eq "t") { $currqual = $read[4]; }
446	0					0	else { $currqual = "UNKNOWN"; }
447	3734					2092	push @{$accuracies->{"a"}},$read[1];
	3734					3204
448	3734					2026	push @{$accuracies->{"c"}},$read[2];
	3734					2797
449	3734					2103	push @{$accuracies->{"g"}},$read[3];
	3734					2686
450	3734					2084	push @{$accuracies->{"t"}},$read[4];
	3734					2561
451
452	3734					2349	$sequence .= $currbase;
453	3734					4909	push @qualities,$currqual;
454							}
455	4					40	return (\@indices,\@qualities,$sequence,$accuracies)
456							}
457
458							=head2 _parse_v2_traces(\@traces_array)
459
460							Title : _pares_v2_traces(\@traces_array)
461							Usage : $self->_parse_v2_traces(\@traces_array);
462							Function: Parses an scf Version2 trace array into its base components.
463							Returns : Nothing. Modifies $self.
464							Args : A reference to an array of the unpacked traces section of an
465							scf version2 file.
466
467							=cut
468
469							sub _parse_v2_traces {
470	4			4		7	my ($self,$buffer,$sample_size) = @_;
471	4					6	my $byte;
472	4	50				8	if ($sample_size == 1) { $byte = "c"; }
	0					0
473	4					6	else { $byte = "n"; }
474	4					4	my $length = CORE::length($buffer);
475	4					12522	my @read = unpack "${byte}${length}",$buffer;
476							# this will be an array to the reference holding the array
477	4					2979	my $traces;
478	4					8	my $array = 0;
479	4					28	for (my $offset2 = 0; $offset2< scalar(@read); $offset2+=4) {
480	46000					24674	push @{$traces->{'a'}},$read[$offset2];
	46000					35098
481	46000					25059	push @{$traces->{'c'}},$read[$offset2+1];
	46000					35564
482	46000					24395	push @{$traces->{'g'}},$read[$offset2+3];
	46000					35081
483	46000					24592	push @{$traces->{'t'}},$read[$offset2+2];
	46000					65203
484							}
485	4					3184	return $traces;
486							}
487
488
489				0	0		sub get_trace_deprecated_use_the_sequencetrace_object_instead {
490							# my ($self,$base_channel,$traces) = @_;
491							# $base_channel =~ tr/a-z/A-Z/;
492							# if ($base_channel !~ /A\|T\|G\|C/) {
493							# $self->throw("You tried to ask for a base channel that wasn't A,T,G, or C. Ask for one of those next time.");
494							##} elsif ($base_channel) {
495							# my @temp = split(' ',$self->{'traces'}->{$base_channel});
496							#return \@temp;
497							#}
498							}
499
500							sub _deprecated_get_peak_indices_deprecated_use_the_sequencetrace_object_instead {
501	0			0		0	my ($self) = shift;
502	0					0	my @temp = split(' ',$self->{'parsed'}->{'peak_indices'});
503	0					0	return \@temp;
504							}
505
506
507							=head2 get_header()
508
509							Title : get_header()
510							Usage : %header = %{$obj->get_header()};
511							Function: Return the header for this scf.
512							Returns : A reference to a hash containing the header for this scf.
513							Args : None.
514							Notes :
515
516							=cut
517
518							sub get_header {
519	1			1	1	556	my ($self) = shift;
520	1					13	return $self->{'header'};
521							}
522
523							=head2 get_comments()
524
525							Title : get_comments()
526							Usage : %comments = %{$obj->get_comments()};
527							Function: Return the comments for this scf.
528							Returns : A Bio::Annotation::Collection object
529							Args : None.
530							Notes :
531
532							=cut
533
534							sub get_comments {
535	1			1	1	2	my ($self) = shift;
536	1					3	return $self->{'comments'};
537							}
538
539							sub _dump_traces_outgoing_deprecated_use_the_sequencetrace_object {
540	0			0		0	my ($self,$transformed) = @_;
541	0					0	my (@sA,@sT,@sG,@sC);
542	0	0				0	if ($transformed) {
543	0					0	@sA = @{$self->{'text'}->{'t_samples_a'}};
	0					0
544	0					0	@sC = @{$self->{'text'}->{'t_samples_c'}};
	0					0
545	0					0	@sG = @{$self->{'text'}->{'t_samples_g'}};
	0					0
546	0					0	@sT = @{$self->{'text'}->{'t_samples_t'}};
	0					0
547							}
548							else {
549	0					0	@sA = @{$self->{'text'}->{'samples_a'}};
	0					0
550	0					0	@sC = @{$self->{'text'}->{'samples_c'}};
	0					0
551	0					0	@sG = @{$self->{'text'}->{'samples_g'}};
	0					0
552	0					0	@sT = @{$self->{'text'}->{'samples_t'}};
	0					0
553							}
554	0					0	print ("Count\ta\tc\tg\tt\n");
555	0					0	for (my $curr=0; $curr < scalar(@sG); $curr++) {
556	0					0	print("$curr\t$sA[$curr]\t$sC[$curr]\t$sG[$curr]\t$sT[$curr]\n");
557							}
558	0					0	return;
559							}
560
561				0			sub _dump_traces_incoming_deprecated_use_the_sequencetrace_object {
562							# my ($self) = @_;
563							# my (@sA,@sT,@sG,@sC);
564							# @sA = @{$self->{'traces'}->{'A'}};
565							# @sC = @{$self->{'traces'}->{'C'}};
566							# @sG = @{$self->{'traces'}->{'G'}};
567							# @sT = @{$self->{'traces'}->{'T'}};
568							# @sA = @{$self->get_trace('A')};
569							# @sC = @{$self->get_trace('C')};
570							# @sG = @{$self->get_trace('G')};
571							# @sT = @{$self->get_trace('t')};
572							# print ("Count\ta\tc\tg\tt\n");
573							# for (my $curr=0; $curr < scalar(@sG); $curr++) {
574							# print("$curr\t$sA[$curr]\t$sC[$curr]\t$sG[$curr]\t$sT[$curr]\n");
575							#}
576							#return;
577							}
578
579							=head2 write_seq
580
581							Title : write_seq(-target => $swq, )
582							Usage : $obj->write_seq(
583							-target => $swq,
584							-version => 2,
585							-CONV => "Bioperl-Chads Mighty SCF writer.");
586							Function: Write out an scf.
587							Returns : Nothing.
588							Args : Requires: a reference to a Bio::Seq::Quality object to form the
589							basis for the scf.
590							if -version is provided, it should be "2" or "3". A SCF of that
591							version will be written.
592							Any other arguments are assumed to be comments and are put into
593							the comments section of the scf. Read the specifications for scf
594							to decide what might be good to put in here.
595
596							Notes :
597							For best results, use a SequenceTrace object.
598							The things that you need to write an scf:
599							a) sequence
600							b) quality
601							c) peak indices
602							d) traces
603							- You _can_ write an scf with just a and b by passing in a
604							Bio::Seq::Quality object- false traces will be synthesized
605							for you.
606
607							=cut
608
609							sub write_seq {
610	10			10	1	3174	my ($self,%args) = @_;
611	10					13	my %comments;
612	10					18	my ($label,$arg);
613	10					47	my ($swq) = $self->_rearrange([qw(TARGET)], %args);
614	10					15	my $writer_fodder;
615	10	50				59	if (ref($swq) =~ /Bio::Seq::SequenceTrace\|Bio::Seq::Quality/) {
616	10	100				31	if (ref($swq) eq "Bio::Seq::Quality") {
617							# this means that the object has no trace data
618							# we might as well synthesize some now, ok?
619	2					13	$swq = Bio::Seq::SequenceTrace->new(
620							-swq => $swq
621							);
622							}
623							}
624							else {
625	0					0	$self->throw("You must pass a Bio::Seq::Quality or a Bio::Seq::SequenceTrace object to write_seq as a parameter named \"target\"");
626							}
627							# all of the rest of the arguments are comments for the scf
628	10					45	foreach $arg (sort keys %args) {
629	23	100				61	next if ($arg =~ /target/i);
630	13					23	($label = $arg) =~ s/^\-//;
631	13					21	$writer_fodder->{comments}->{$label} = $args{$arg};
632							}
633	10	50				31	if (!$comments{'NAME'}) { $comments{'NAME'} = $swq->id(); }
	10					25
634							# HA! Bwahahahaha.
635	10	50				42	$writer_fodder->{comments}->{'CONV'} = "Bioperl-Chads Mighty SCF writer." unless defined $comments{'CONV'};
636							# now deal with the version of scf they want to write
637	10	100				23	if ($writer_fodder->{comments}->{version}) {
638	1	50	33			8	if ($writer_fodder->{comments}->{version} != 2 && $writer_fodder->{comments}->{version} != 3) {
		50
639	0					0	$self->warn("This module can only write version 2.0 or 3.0 scf's. Writing a version 2.0 scf by default.");
640	0					0	$writer_fodder->{header}->{version} = "2.00";
641							}
642							elsif ($writer_fodder->{comments}->{'version'} > 2) {
643	0					0	$writer_fodder->{header}->{'version'} = "3.00";
644							}
645							else {
646	1					3	$writer_fodder->{header}->{version} = "2";
647							}
648							}
649							else {
650	9					21	$writer_fodder->{header}->{'version'} = "3.00";
651							}
652							# set a few things in the header
653	10					21	$writer_fodder->{'header'}->{'magic'} = ".scf";
654	10					11	$writer_fodder->{'header'}->{'sample_size'} = "2";
655	10					25	$writer_fodder->{'header'}->{'bases'} = length($swq->seq());
656	10					19	$writer_fodder->{'header'}->{'bases_left_clip'} = "0";
657	10					15	$writer_fodder->{'header'}->{'bases_right_clip'} = "0";
658	10					14	$writer_fodder->{'header'}->{'sample_size'} = "2";
659	10					15	$writer_fodder->{'header'}->{'code_set'} = "9";
660	10					22	@{$writer_fodder->{'header'}->{'spare'}} = qw(0 0 0 0 0 0 0 0 0 0
	10					65
661							0 0 0 0 0 0 0 0 0 0);
662	10					17	$writer_fodder->{'header'}->{'samples_offset'} = "128";
663	10					35	$writer_fodder->{'header'}->{'samples'} = $swq->trace_length();
664							# create the binary for the comments and file it in writer_fodder
665							$writer_fodder->{comments} = $self->_get_binary_comments(
666	10					31	$writer_fodder->{comments});
667							# create the binary and the strings for the traces, bases,
668							# offsets (if necessary), and accuracies (if necessary)
669							$writer_fodder->{traces} = $self->_get_binary_traces(
670							$writer_fodder->{'header'}->{'version'},
671	10					47	$swq,$writer_fodder->{'header'}->{'sample_size'});
672	10					17	my ($b_base_offsets,$b_base_accuracies,$samples_size,$bases_size);
673							#
674							# version 2
675							#
676	10	100				61	if ($writer_fodder->{'header'}->{'version'} == 2) {
677							$writer_fodder->{bases} = $self->_get_binary_bases(
678							2,
679							$swq,
680	1					6	$writer_fodder->{'header'}->{'sample_size'});
681	1					2	$samples_size = CORE::length($writer_fodder->{traces}->{'binary'});
682	1					3	$bases_size = CORE::length($writer_fodder->{bases}->{binary});
683	1					4	$writer_fodder->{'header'}->{'bases_offset'} = 128 + $samples_size;
684	1					3	$writer_fodder->{'header'}->{'comments_offset'} = 128 +
685							$samples_size + $bases_size;
686							$writer_fodder->{'header'}->{'comments_size'} =
687	1					3	length($writer_fodder->{'comments'}->{binary});
688	1					3	$writer_fodder->{'header'}->{'private_size'} = "0";
689							$writer_fodder->{'header'}->{'private_offset'} = 128 +
690							$samples_size + $bases_size +
691	1					4	$writer_fodder->{'header'}->{'comments_size'};
692							$writer_fodder->{'header'}->{'binary'} =
693	1					5	$self->_get_binary_header($writer_fodder->{header});
694	1	50				8	$dumper->dumpValue($writer_fodder) if $self->verbose > 0;
695	1	50				7	$self->_print ($writer_fodder->{'header'}->{'binary'})
696							or print("Could not write binary header...\n");
697	1	50				4	$self->_print ($writer_fodder->{'traces'}->{'binary'})
698							or print("Could not write binary traces...\n");
699	1	50				5	$self->_print ($writer_fodder->{'bases'}->{'binary'})
700							or print("Could not write binary base structures...\n");
701	1	50				4	$self->_print ($writer_fodder->{'comments'}->{'binary'})
702							or print("Could not write binary comments...\n");
703							}
704							else {
705							($writer_fodder->{peak_indices},
706							$writer_fodder->{accuracies},
707							$writer_fodder->{bases},
708							$writer_fodder->{reserved} ) =
709							$self->_get_binary_bases(
710							3,
711							$swq,
712	9					41	$writer_fodder->{'header'}->{'sample_size'}
713							);
714							$writer_fodder->{'header'}->{'bases_offset'} = 128 +
715	9					24	length($writer_fodder->{'traces'}->{'binary'});
716							$writer_fodder->{'header'}->{'comments_size'} =
717	9					24	length($writer_fodder->{'comments'}->{'binary'});
718							# this is:
719							# bases_offset + base_offsets + accuracies + called_bases +
720							# reserved
721	9					23	$writer_fodder->{'header'}->{'private_size'} = "0";
722
723							$writer_fodder->{'header'}->{'comments_offset'} =
724							128+length($writer_fodder->{'traces'}->{'binary'})+
725							length($writer_fodder->{'peak_indices'}->{'binary'})+
726							length($writer_fodder->{'accuracies'}->{'binary'})+
727							length($writer_fodder->{'bases'}->{'binary'})+
728	9					37	length($writer_fodder->{'reserved'}->{'binary'});
729							$writer_fodder->{'header'}->{'private_offset'} =
730							$writer_fodder->{'header'}->{'comments_offset'} +
731	9					25	$writer_fodder->{'header'}->{'comments_size'};
732							$writer_fodder->{'header'}->{'spare'}->[1] =
733							$writer_fodder->{'header'}->{'comments_offset'} +
734	9					28	length($writer_fodder->{'comments'}->{'binary'});
735							$writer_fodder->{header}->{binary} =
736	9					32	$self->_get_binary_header($writer_fodder->{header});
737	9	50				62	$self->_print ($writer_fodder->{'header'}->{'binary'})
738							or print("Couldn't write header\n");
739	9	50				28	$self->_print ($writer_fodder->{'traces'}->{'binary'})
740							or print("Couldn't write samples\n");
741	9	50				34	$self->_print ($writer_fodder->{'peak_indices'}->{'binary'})
742							or print("Couldn't write peak offsets\n");
743	9	50				30	$self->_print ($writer_fodder->{'accuracies'}->{'binary'})
744							or print("Couldn't write accuracies\n");
745	9	50				29	$self->_print ($writer_fodder->{'bases'}->{'binary'})
746							or print("Couldn't write called_bases\n");
747	9	50				25	$self->_print ($writer_fodder->{'reserved'}->{'binary'})
748							or print("Couldn't write reserved\n");
749	9	50				24	$self->_print ($writer_fodder->{'comments'}->{'binary'})
750							or print ("Couldn't write comments\n");
751							}
752
753							# kinda unnecessary, given the close() below, but maybe that'll go
754							# away someday.
755	10	50	33			36	$self->flush if $self->_flush_on_write && defined $self->_fh;
756
757	10					36	$self->close();
758	10					4763	return 1;
759							}
760
761
762
763
764
765							=head2 _get_binary_header()
766
767							Title : _get_binary_header();
768							Usage : $self->_get_binary_header();
769							Function: Provide the binary string that will be used as the header for
770							a scfv2 document.
771							Returns : A binary string.
772							Args : None. Uses the entries in the $self->{'header'} hash. These
773							are set on construction of the object (hopefully correctly!).
774							Notes :
775
776							=cut
777
778							sub _get_binary_header {
779	10			10		14	my ($self,$header) = @_;
780							my $binary = pack "a4 NNNNNNNN a4 NN N20",
781							(
782							$header->{'magic'},
783							$header->{'samples'},
784							$header->{'samples_offset'},
785							$header->{'bases'},
786							$header->{'bases_left_clip'},
787							$header->{'bases_right_clip'},
788							$header->{'bases_offset'},
789							$header->{'comments_size'},
790							$header->{'comments_offset'},
791							$header->{'version'},
792							$header->{'sample_size'},
793							$header->{'code_set'},
794	10					33	@{$header->{'spare'}}
	10					84
795							);
796	10					51	return $binary;
797							}
798
799							=head2 _get_binary_traces($version,$ref)
800
801							Title : _set_binary_tracesbases($version,$ref)
802							Usage : $self->_set_binary_tracesbases($version,$ref);
803							Function: Constructs the trace and base strings for all scfs
804							Returns : Nothing. Alters self.
805							Args : $version - "2" or "3"
806							$sequence - a scalar containing arbitrary sequence data
807							$ref - a reference to either a SequenceTraces or a
808							SequenceWithQuality object.
809							Notes : This is a really complicated thing.
810
811							=cut
812
813							sub _get_binary_traces {
814	10			10		10	my ($self,$version,$ref,$sample_size) = @_;
815							# ref _should_ be a Bio::Seq::SequenceTrace, but might be a
816							# Bio::Seq::Quality
817	10					11	my $returner;
818	10					20	my $sequence = $ref->seq();
819	10					15	my $sequence_length = length($sequence);
820							# first of all, do we need to synthesize the trace?
821							# if so, call synthesize_base
822	10					13	my ($traceobj,@traces,$current);
823	10	50				22	if ( ref($ref) eq "Bio::Seq::Quality" ) {
824	0					0	$traceobj = Bio::Seq::Quality->new(
825							-target => $ref
826							);
827	0					0	$traceobj->_synthesize_traces();
828							}
829							else {
830	10					10	$traceobj = $ref;
831	10	100				47	if ($version eq "2") {
		50
832	1					3	my $trace_length = $traceobj->trace_length();
833	1					5	for ($current = 1; $current <= $trace_length; $current++) {
834	14107					12803	foreach (qw(a c g t)) {
835	56428					66857	push @traces,$traceobj->trace_value_at($_,$current);
836							}
837							}
838							}
839							elsif ($version == 3) {
840	9					18	foreach my $current_trace (qw(a c g t)) {
841	36					38	my @trace = @{$traceobj->trace($current_trace)};
	36					133
842	36					88	foreach (@trace) {
843	245300	50				262367	if ($_ > 30000) {
844	0					0	$_ -= 65536;
845							}
846							}
847	36					158	my $transformed = $self->_delta(\@trace,"forward");
848	36	50				74	if($sample_size == 1){
849	0					0	foreach (@{$transformed}) {
	0					0
850	0	0				0	$_ += 256 if ($_ < 0);
851							}
852							}
853	36					44	push @traces,@{$transformed};
	36					28371
854							}
855							}
856							}
857	10					62	$returner->{version} = $version;
858	10					34	$returner->{string} = \@traces;
859	10					18	my $length_of_traces = scalar(@traces);
860	10					15	my $byte;
861	10	50				31	if ($sample_size == 1) { $byte = "c"; } else { $byte = "n"; }
	0					0
	10					14
862							# an unsigned integer should be I, but this is too long
863							#
864	10					5984	$returner->{binary} = pack "n${length_of_traces}",@traces;
865	10					27	$returner->{length} = CORE::length($returner->{binary});
866	10					47	return $returner;
867							}
868
869
870							sub _get_binary_bases {
871	10			10		23	my ($self,$version,$trace,$sample_size) = @_;
872	10					11	my $byte;
873	10	50				30	if ($sample_size == 1) { $byte = "c"; } else { $byte = "n"; }
	0					0
	10					12
874	10					18	my ($returner,@current_row,$current_base,$string,$binary);
875	10					45	my $length = $trace->length();
876	10	100				27	if ($version == 2) {
877	1					5	$returner->{'version'} = "2";
878	1					4	for (my $current_base =1; $current_base <= $length; $current_base++) {
879	1106					732	my @current_row;
880	1106					1331	push @current_row,$trace->peak_index_at($current_base);
881	1106					1431	push @current_row,$trace->accuracy_at("a",$current_base);
882	1106					1290	push @current_row,$trace->accuracy_at("c",$current_base);
883	1106					1260	push @current_row,$trace->accuracy_at("g",$current_base);
884	1106					1232	push @current_row,$trace->accuracy_at("t",$current_base);
885	1106					1295	push @current_row,$trace->baseat($current_base);
886	1106					898	push @current_row,0,0,0;
887	1106					618	push @{$returner->{string}},@current_row;
	1106					1739
888	1106					2894	$returner->{binary} .= pack "N C C C C a C3",@current_row;
889							}
890	1					4	return $returner;
891							}
892							else {
893	9					25	$returner->{'version'} = "3.00";
894	9					27	$returner->{peak_indices}->{string} = $trace->peak_indices();
895	9					10	my $length = scalar(@{$returner->{peak_indices}->{string}});
	9					21
896							$returner->{peak_indices}->{binary} =
897	9					21	pack "N$length",@{$returner->{peak_indices}->{string}};
	9					365
898							$returner->{peak_indices}->{length} =
899	9					19	CORE::length($returner->{peak_indices}->{binary});
900	9					15	my @accuracies;
901	9					20	foreach my $base (qw(a c g t)) {
902	36					72	$returner->{accuracies}->{$base} = $trace->accuracies($base);
903	36					34	push @accuracies,@{$trace->accuracies($base)};
	36					60
904							}
905	9					30	$returner->{sequence} = $trace->seq();
906	9					14	$length = scalar(@accuracies);
907							# this really is "c" for samplesize == 2
908	9					302	$returner->{accuracies}->{binary} = pack "C${length}",@accuracies;
909							$returner->{accuracies}->{length} =
910	9					25	CORE::length($returner->{accuracies}->{binary});
911	9					26	$length = $trace->seq_obj()->length();
912	9					33	for (my $count=0; $count< $length; $count++) {
913	4629					2362	push @{$returner->{reserved}->{string}},0,0,0;
	4629					6867
914							}
915							}
916	9					9	$length = scalar(@{$returner->{reserved}->{string}});
	9					18
917							# this _must_ be "c"
918							$returner->{'reserved'}->{'binary'} =
919	9					19	pack "c$length",@{$returner->{reserved}->{string}};
	9					222
920							$returner->{'reserved'}->{'length'} =
921	9					19	CORE::length($returner->{'reserved'}->{'binary'});
922							# $returner->{'bases'}->{'string'} = $trace->seq();
923	9					85	my @bases = split('',$trace->seq());
924	9					25	$length = $trace->length();
925	9					18	$returner->{'bases'}->{'binary'} = $trace->seq();
926							# print("Returning this:\n");
927							# $dumper->dumpValue($returner);
928							return ($returner->{peak_indices},
929							$returner->{accuracies},
930							$returner->{bases},
931	9					211	$returner->{reserved});
932
933							}
934
935
936							=head2 _make_trace_string($version)
937
938							Title : _make_trace_string($version)
939							Usage : $self->_make_trace_string($version)
940							Function: Merges trace data for the four bases to produce an scf
941							trace string. _requires_ $version
942							Returns : Nothing. Alters $self.
943							Args : $version - a version number. "2" or "3"
944							Notes :
945
946							=cut
947
948							sub _make_trace_string {
949	0			0		0	my ($self,$version) = @_;
950	0					0	my @traces;
951							my @traces_view;
952	0					0	my @as = @{$self->{'text'}->{'samples_a'}};
	0					0
953	0					0	my @cs = @{$self->{'text'}->{'samples_c'}};
	0					0
954	0					0	my @gs = @{$self->{'text'}->{'samples_g'}};
	0					0
955	0					0	my @ts = @{$self->{'text'}->{'samples_t'}};
	0					0
956	0	0				0	if ($version == 2) {
		0
957	0					0	for (my $curr=0; $curr < scalar(@as); $curr++) {
958	0	0				0	$as[$curr] = $DEFAULT_QUALITY unless defined $as[$curr];
959	0	0				0	$cs[$curr] = $DEFAULT_QUALITY unless defined $cs[$curr];
960	0	0				0	$gs[$curr] = $DEFAULT_QUALITY unless defined $gs[$curr];
961	0	0				0	$ts[$curr] = $DEFAULT_QUALITY unless defined $ts[$curr];
962	0					0	push @traces,($as[$curr],$cs[$curr],$gs[$curr],$ts[$curr]);
963							}
964							}
965							elsif ($version == 3) {
966	0					0	@traces = (@as,@cs,@gs,@ts);
967							}
968							else {
969	0					0	$self->throw("No idea what version required to make traces here. You gave #$version# Bailing.");
970							}
971	0					0	my $length = scalar(@traces);
972	0					0	$self->{'text'}->{'samples_all'} = \@traces;
973
974							}
975
976							=head2 _get_binary_comments(\@comments)
977
978							Title : _get_binary_comments(\@comments)
979							Usage : $self->_get_binary_comments(\@comments);
980							Function: Provide a binary string that will be the comments section of
981							the scf file. See the scf specifications for detailed
982							specifications for the comments section of an scf file. Hint:
983							CODE=something\nBODE=something\n\0
984							Returns :
985							Args : A reference to an array containing comments.
986							Notes : None.
987
988							=cut
989
990							sub _get_binary_comments {
991	10			10		11	my ($self,$rcomments) = @_;
992	10					13	my $returner;
993	10					11	my $comments_string = '';
994	10					32	my %comments = %$rcomments;
995	10					26	foreach my $key (sort keys %comments) {
996	21		50			33	$comments{$key} \|\|= '';
997	21					49	$comments_string .= "$key=$comments{$key}\n";
998							}
999	10					16	$comments_string .= "\n\0";
1000	10					11	my $length = CORE::length($comments_string);
1001	10					20	$returner->{length} = $length;
1002	10					17	$returner->{string} = $comments_string;
1003	10					62	$returner->{binary} = pack "A$length",$comments_string;
1004	10					29	return $returner;
1005							}
1006
1007							#=head2 _fill_missing_data($swq)
1008							#
1009							# Title : _fill_missing_data($swq)
1010							# Usage : $self->_fill_missing_data($swq);
1011							# Function: If the $swq with quality has no qualities, set all qualities
1012							# to 0.
1013							# If the $swq has no sequence, set the sequence to N's.
1014							# Returns : Nothing. Modifies the Bio::Seq::Quality that was passed as an
1015							# argument.
1016							# Args : A reference to a Bio::Seq::Quality
1017							# Notes : None.
1018							#
1019							#=cut
1020							#
1021							##'
1022							#sub _fill_missing_data {
1023							# my ($self,$swq) = @_;
1024							# my $qual_obj = $swq->qual_obj();
1025							# my $seq_obj = $swq->seq_obj();
1026							# if ($qual_obj->length() == 0 && $seq_obj->length() != 0) {
1027							# my $fake_qualities = ("$DEFAULT_QUALITY ")x$seq_obj->length();
1028							# $swq->qual($fake_qualities);
1029							# }
1030							# if ($seq_obj->length() == 0 && $qual_obj->length != 0) {
1031							# my $sequence = ("N")x$qual_obj->length();
1032							# $swq->seq($sequence);
1033							# }
1034							#}
1035
1036							=head2 _delta(\@trace_data,$direction)
1037
1038							Title : _delta(\@trace_data,$direction)
1039							Usage : $self->_delta(\@trace_data,$direction);
1040							Function:
1041							Returns : A reference to an array containing modified trace values.
1042							Args : A reference to an array containing trace data and a string
1043							indicating the direction of conversion. ("forward" or
1044							"backward").
1045							Notes : This code is taken from the specification for SCF3.2.
1046							http://www.mrc-lmb.cam.ac.uk/pubseq/manual/formats_unix_4.html
1047
1048							=cut
1049
1050
1051							sub _delta {
1052	80			80		146	my ($self,$rsamples,$direction) = @_;
1053	80					30745	my @samples = @$rsamples;
1054							# /* If job == DELTA_IT:
1055							# * change a series of sample points to a series of delta delta values:
1056							# * ie change them in two steps:
1057							# * first: delta = current_value - previous_value
1058							# * then: delta_delta = delta - previous_delta
1059							# * else
1060							# * do the reverse
1061							# */
1062							# int i;
1063							# uint_2 p_delta, p_sample;
1064
1065	80					105	my ($i,$num_samples,$p_delta,$p_sample,@samples_converted,$p_sample1,$p_sample2);
1066	80					84	my $SLOW_BUT_CLEAR = 0;
1067	80					87	$num_samples = scalar(@samples);
1068							# c-programmers are funny people with their single-letter variables
1069
1070	80	100				249	if ( $direction eq "forward" ) {
		50
1071	36	50				49	if($SLOW_BUT_CLEAR){
1072	0					0	$p_delta = 0;
1073	0					0	for ($i=0; $i < $num_samples; $i++) {
1074	0					0	$p_sample = $samples[$i];
1075	0					0	$samples[$i] = $samples[$i] - $p_delta;
1076	0					0	$p_delta = $p_sample;
1077							}
1078	0					0	$p_delta = 0;
1079	0					0	for ($i=0; $i < $num_samples; $i++) {
1080	0					0	$p_sample = $samples[$i];
1081	0					0	$samples[$i] = $samples[$i] - $p_delta;
1082	0					0	$p_delta = $p_sample;
1083							}
1084							} else {
1085	36					102	for ($i = $num_samples-1; $i > 1; $i--){
1086	245228					319407	$samples[$i] = $samples[$i] - 2*$samples[$i-1] + $samples[$i-2];
1087							}
1088	36					54	$samples[1] = $samples[1] - 2*$samples[0];
1089							}
1090							}
1091							elsif ($direction eq "backward") {
1092	44	50				75	if($SLOW_BUT_CLEAR){
1093	0					0	$p_sample = 0;
1094	0					0	for ($i=0; $i < $num_samples; $i++) {
1095	0					0	$samples[$i] = $samples[$i] + $p_sample;
1096	0					0	$p_sample = $samples[$i];
1097							}
1098	0					0	$p_sample = 0;
1099	0					0	for ($i=0; $i < $num_samples; $i++) {
1100	0					0	$samples[$i] = $samples[$i] + $p_sample;
1101	0					0	$p_sample = $samples[$i];
1102							}
1103							} else {
1104	44					51	$p_sample1 = $p_sample2 = 0;
1105	44					95	for ($i = 0; $i < $num_samples; $i++){
1106	424924					246864	$p_sample1 = $p_sample1 + $samples[$i];
1107	424924					247858	$samples[$i] = $p_sample1 + $p_sample2;
1108	424924					468588	$p_sample2 = $samples[$i];
1109							}
1110
1111							}
1112							}
1113							else {
1114	0					0	$self->warn("Bad direction. Use \"forward\" or \"backward\".");
1115							}
1116	80					310	return \@samples;
1117							}
1118
1119							=head2 _unpack_magik($buffer)
1120
1121							Title : _unpack_magik($buffer)
1122							Usage : $self->_unpack_magik($buffer)
1123							Function: What unpack specification should be used? Try them all.
1124							Returns : Nothing.
1125							Args : A buffer containing arbitrary binary data.
1126							Notes : Eliminate the ambiguity and the guesswork. Used in the
1127							adaptation of _delta(), mostly.
1128
1129							=cut
1130
1131							sub _unpack_magik {
1132	0			0		0	my ($self,$buffer) = @_;
1133	0					0	my $length = length($buffer);
1134	0					0	my (@read,$counter);
1135	0					0	foreach (qw(c C s S i I l L n N v V)) {
1136	0					0	@read = unpack "$_$length", $buffer;
1137	0					0	for ($counter=0; $counter < 20; $counter++) {
1138	0					0	print("$read[$counter]\n");
1139							}
1140							}
1141							}
1142
1143							=head2 read_from_buffer($filehandle,$buffer,$length)
1144
1145							Title : read_from_buffer($filehandle,$buffer,$length)
1146							Usage : $self->read_from_buffer($filehandle,$buffer,$length);
1147							Function: Read from the buffer.
1148							Returns : $buffer, containing a read of $length
1149							Args : a filehandle, a buffer, and a read length
1150							Notes : I just got tired of typing
1151							"unless (length($buffer) == $length)" so I put it here.
1152
1153							=cut
1154
1155							sub read_from_buffer {
1156	100			100	1	211	my ($self,$fh,$buffer,$length,$start_position) = @_;
1157							# print("Reading from a buffer!!! length($length) ");
1158	100	100				230	if ($start_position) {
1159							# print(" startposition($start_position)(".sprintf("%X", $start_position).")\n");
1160							}
1161							# print("\n");
1162	100	100				197	if ($start_position) {
1163							# print("seeking to this position in the file: (".$start_position.")\n");
1164	81					324	seek ($fh,$start_position,0);
1165							# print("done. here is where I am now: (".tell($fh).")\n");
1166							}
1167							else {
1168							# print("You did not specify a start position. Going from this position (the current position) (".tell($fh).")\n");
1169							}
1170	100					1725	read $fh, $buffer, $length;
1171	100	50				219	unless (length($buffer) == $length) {
1172	0					0	$self->warn("The read was incomplete! Trying harder.");
1173	0					0	my $missing_length = $length - length($buffer);
1174	0					0	my $buffer2;
1175	0					0	read $fh,$buffer2,$missing_length;
1176	0					0	$buffer .= $buffer2;
1177	0	0				0	if (length($buffer) != $length) {
1178	0					0	$self->throw("Unexpected end of file while reading from SCF file. I should have read $length but instead got ".length($buffer)."! Current file position is ".tell($fh).".");
1179							}
1180							}
1181
1182	100					265	return $buffer;
1183							}
1184
1185							=head2 _dump_keys()
1186
1187							Title : _dump_keys()
1188							Usage : &_dump_keys($a_reference_to_some_hash)
1189							Function: Dump out the keys in a hash.
1190							Returns : Nothing.
1191							Args : A reference to a hash.
1192							Notes : A debugging method.
1193
1194							=cut
1195
1196							sub _dump_keys {
1197	0			0			my $rhash = shift;
1198	0	0					if ($rhash !~ /HASH/) {
1199	0						print("_dump_keys: that was not a hash.\nIt was #$rhash# which was this reference:".ref($rhash)."\n");
1200	0						return;
1201							}
1202	0						print("_dump_keys: The keys for $rhash are:\n");
1203	0						foreach (sort keys %$rhash) {
1204	0						print("$_\n");
1205							}
1206							}
1207
1208							=head2 _dump_base_accuracies()
1209
1210							Title : _dump_base_accuracies()
1211							Usage : $self->_dump_base_accuracies();
1212							Function: Dump out the v3 base accuracies in an easy to read format.
1213							Returns : Nothing.
1214							Args : None.
1215							Notes : A debugging method.
1216
1217							=cut
1218
1219							sub _dump_base_accuracies {
1220	0			0			my $self = shift;
1221	0						print("Dumping base accuracies! for v3\n");
1222	0						print("There are this many elements in a,c,g,t:\n");
1223	0						print(scalar(@{$self->{'text'}->{'v3_base_accuracy_a'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_c'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_g'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_t'}})."\n");
	0
	0
	0
	0
1224	0						my $number_traces = scalar(@{$self->{'text'}->{'v3_base_accuracy_a'}});
	0
1225	0						for (my $counter=0; $counter < $number_traces; $counter++ ) {
1226	0						print("$counter\t");
1227	0						print $self->{'text'}->{'v3_base_accuracy_a'}->[$counter]."\t";
1228	0						print $self->{'text'}->{'v3_base_accuracy_c'}->[$counter]."\t";
1229	0						print $self->{'text'}->{'v3_base_accuracy_g'}->[$counter]."\t";
1230	0						print $self->{'text'}->{'v3_base_accuracy_t'}->[$counter]."\t";
1231	0						print("\n");
1232							}
1233							}
1234
1235							=head2 _dump_peak_indices_incoming()
1236
1237							Title : _dump_peak_indices_incoming()
1238							Usage : $self->_dump_peak_indices_incoming();
1239							Function: Dump out the v3 peak indices in an easy to read format.
1240							Returns : Nothing.
1241							Args : None.
1242							Notes : A debugging method.
1243
1244							=cut
1245
1246							sub _dump_peak_indices_incoming {
1247	0			0			my $self = shift;
1248	0						print("Dump peak indices incoming!\n");
1249	0						my $length = $self->{'bases'};
1250	0						print("The length is $length\n");
1251	0						for (my $count=0; $count < $length; $count++) {
1252	0						print("$count\t$self->{parsed}->{peak_indices}->[$count]\n");
1253							}
1254							}
1255
1256							=head2 _dump_base_accuracies_incoming()
1257
1258							Title : _dump_base_accuracies_incoming()
1259							Usage : $self->_dump_base_accuracies_incoming();
1260							Function: Dump out the v3 base accuracies in an easy to read format.
1261							Returns : Nothing.
1262							Args : None.
1263							Notes : A debugging method.
1264
1265							=cut
1266
1267							sub _dump_base_accuracies_incoming {
1268	0			0			my $self = shift;
1269	0						print("Dumping base accuracies! for v3\n");
1270							# print("There are this many elements in a,c,g,t:\n");
1271							# print(scalar(@{$self->{'parsed'}->{'v3_base_accuracy_a'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_c'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_g'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_t'}})."\n");
1272	0						my $number_traces = $self->{'bases'};
1273	0						for (my $counter=0; $counter < $number_traces; $counter++ ) {
1274	0						print("$counter\t");
1275	0						foreach (qw(A T G C)) {
1276	0						print $self->{'parsed'}->{'base_accuracies'}->{$_}->[$counter]."\t";
1277							}
1278	0						print("\n");
1279							}
1280							}
1281
1282
1283							=head2 _dump_comments()
1284
1285							Title : _dump_comments()
1286							Usage : $self->_dump_comments();
1287							Function: Debug dump the comments section from the scf.
1288							Returns : Nothing.
1289							Args : Nothing.
1290							Notes : None.
1291
1292							=cut
1293
1294							sub _dump_comments {
1295	0			0			my ($self) = @_;
1296	0						warn ("SCF comments:\n");
1297	0						foreach my $k (keys %{$self->{'comments'}}) {
	0
1298	0						warn ("\t {$k} ==> ", $self->{'comments'}->{$k}, "\n");
1299							}
1300							}
1301
1302
1303
1304							1;
1305							__END__