File Coverage

Bio/SeqIO/scf.pm

Criterion	Covered	Total	%
statement	371	518	71.6
branch	77	142	54.2
condition	4	14	28.5
subroutine	26	37	70.2
pod	5	6	83.3
total	483	717	67.3

line	stmt	bran	cond	sub	pod	time	code
1							#
2							# Copyright (c) 1997-2001 bioperl, Chad Matsalla. All Rights Reserved.
3							# This module is free software; you can redistribute it and/or
4							# modify it under the same terms as Perl itself.
5							#
6							# Copyright Chad Matsalla
7							#
8							# You may distribute this module under the same terms as perl itself
9
10							# POD documentation - main docs before the code
11
12							=head1 NAME
13
14							Bio::SeqIO::scf - .scf file input/output stream
15
16							=head1 SYNOPSIS
17
18							Do not use this module directly. Use it via the Bio::SeqIO class, see
19							L for more information.
20
21							=head1 DESCRIPTION
22
23							This object can transform .scf files to and from Bio::Seq::SequenceTrace
24							objects. Mechanisms are present to retrieve trace data from scf
25							files.
26
27							=head1 FEEDBACK
28
29							=head2 Mailing Lists
30
31							User feedback is an integral part of the evolution of this and other
32							Bioperl modules. Send your comments and suggestions preferably to one
33							of the Bioperl mailing lists. Your participation is much appreciated.
34
35							bioperl-l@bioperl.org - General discussion
36							http://bioperl.org/wiki/Mailing_lists - About the mailing lists
37
38							=head2 Support
39
40							Please direct usage questions or support issues to the mailing list:
41
42							I
43
44							rather than to the module maintainer directly. Many experienced and
45							reponsive experts will be able look at the problem and quickly
46							address it. Please include a thorough description of the problem
47							with code and data examples if at all possible.
48
49							=head2 Reporting Bugs
50
51							Report bugs to the Bioperl bug tracking system to help us keep track
52							the bugs and their resolution. Bug reports can be submitted via
53							the web:
54
55							https://github.com/bioperl/bioperl-live/issues
56
57							=head1 AUTHOR Chad Matsalla
58
59							Chad Matsalla
60							bioinformatics@dieselwurks.com
61
62							=head1 CONTRIBUTORS
63
64							Jason Stajich, jason@bioperl.org
65							Tony Cox, avc@sanger.ac.uk
66							Heikki Lehvaslaiho, heikki-at-bioperl-dot-org
67							Nancy Hansen, nhansen at mail.nih.gov
68
69							=head1 APPENDIX
70
71							The rest of the documentation details each of the object
72							methods. Internal methods are usually preceded with a _
73
74							=cut
75
76							# Let the code begin...
77
78							package Bio::SeqIO::scf;
79	1			1		542	use vars qw($DEFAULT_QUALITY);
	1					1
	1					40
80	1			1		3	use strict;
	1					1
	1					16
81	1			1		253	use Bio::Seq::SeqFactory;
	1					1
	1					24
82	1			1		359	use Bio::Seq::SequenceTrace;
	1					1
	1					49
83	1			1		352	use Bio::Annotation::Comment;
	1					2
	1					21
84	1			1		5	use Dumpvalue;
	1					1
	1					31
85
86							my $dumper = Dumpvalue->new();
87							$dumper->veryCompact(1);
88
89							BEGIN {
90	1			1		13	$DEFAULT_QUALITY= 10;
91							}
92
93	1			1		3	use base qw(Bio::SeqIO);
	1					2
	1					360
94
95							sub _initialize {
96	25			25		50	my($self,@args) = @_;
97	25					70	$self->SUPER::_initialize(@args);
98	25	50				232	if( ! defined $self->sequence_factory ) {
99	25					87	$self->sequence_factory(Bio::Seq::SeqFactory->new
100							(-verbose => $self->verbose(),
101							-type => 'Bio::Seq::Quality'));
102							}
103	25					69	binmode $self->_fh; # for the Win32/Mac crowds
104							}
105
106							=head2 next_seq()
107
108							Title : next_seq()
109							Usage : $scf = $stream->next_seq()
110							Function: returns the next scf sequence in the stream
111							Returns : a Bio::Seq::SequenceTrace object
112							Args : NONE
113							Notes : Fills the interface specification for SeqIO.
114							The SCF specification does not provide for having more then
115							one sequence in a given scf. So once the filehandle has been open
116							and passed to SeqIO do not expect to run this function more then
117							once on a given scf unless you embraced and extended the SCF
118							standard. SCF comments are accessible through the Bio::SeqI
119							interface method annotation().
120
121							=cut
122
123							#'
124							sub next_seq {
125	15			15	1	69	my ($self) = @_;
126	15					35	my ($seq, $seqc, $fh, $buffer, $offset, $length, $read_bytes, @read,
127							%names);
128							# set up a filehandle to read in the scf
129	15	50				45	return if $self->{_readfile};
130	15					33	$fh = $self->_fh();
131	15	50				40	unless ($fh) { # simulate the <> function
132	0	0	0			0	if ( !fileno(ARGV) or eof(ARGV) ) {
133	0	0				0	return unless my $ARGV = shift;
134	0	0				0	open(ARGV,$ARGV) or
135							$self->throw("Could not open $ARGV for SCF stream reading $!");
136							}
137	0					0	$fh = \*ARGV;
138							}
139	15	50				266	return unless read $fh, $buffer, 128; # no exception; probably end of file
140							# now, the master data structure will be the creator
141	15					26	my $creator;
142							# he first thing to do is parse the header. This is common
143							# among all versions of scf.
144							# the rest of the the information is different between the
145							# the different versions of scf.
146
147	15					57	$creator->{header} = $self->_get_header($buffer);
148	15	100				61	if ($creator->{header}->{'version'} lt "3.00") {
149	4					22	$self->debug("scf.pm is working with a version 2 scf.\n");
150							# first gather the trace information
151							$length = $creator->{header}->{'samples'} *
152	4					11	$creator->{header}->{sample_size}*4;
153							$buffer = $self->read_from_buffer($fh, $buffer, $length,
154	4					20	$creator->{header}->{samples_offset});
155							# @read = unpack "n$length",$buffer;
156							# these traces need to be split
157							# returns a reference to a hash
158							$creator->{traces} = $self->_parse_v2_traces(
159	4					19	$buffer,$creator->{header}->{sample_size});
160							# now go and get the base information
161	4					17	$offset = $creator->{header}->{bases_offset};
162	4					15	$length = ($creator->{header}->{bases} * 12);
163	4					60	seek $fh,$offset,0;
164	4					40	$buffer = $self->read_from_buffer($fh,$buffer,$length,$creator->{header}->{bases_offset});
165							# now distill the information into its fractions.
166							# the old way : $self->_set_v2_bases($buffer);
167							# ref to an array, ref to a hash, string
168							($creator->{peak_indices},
169							$creator->{qualities},
170							$creator->{sequence},
171	4					21	$creator->{accuracies}) = $self->_parse_v2_bases($buffer);
172
173							} else {
174	11					54	$self->debug("scf.pm is working with a version 3+ scf.\n");
175	11					18	my $transformed_read;
176	11					23	my $current_read_position = $creator->{header}->{sample_offset};
177							$length = $creator->{header}->{'samples'}*
178	11					28	$creator->{header}->{sample_size};
179							# $dumper->dumpValue($creator->{header});
180	11					30	foreach (qw(a c g t)) {
181	44					350	$buffer = $self->read_from_buffer($fh,$buffer,$length,$current_read_position);
182	44					87	my $byte = "n";
183	44	50				162	if ($creator->{header}->{sample_size} == 1) {
184	0					0	$byte = "c";
185							}
186	44					33128	@read = unpack "${byte}${length}",$buffer;
187							# this little spurt of nonsense is because
188							# the trace values are given in the binary
189							# file as unsigned shorts but they really
190							# are signed deltas. 30000 is an arbitrary number
191							# (will there be any traces with a given
192							# point greater then 30000? I hope not.
193							# once the read is read, it must be changed
194							# from relative
195	44					6450	foreach (@read) {
196	424924	100				454504	if ($_ > 30000) {
197	142333					97107	$_ -= 65536;
198							}
199							}
200	44					497	$transformed_read = $self->_delta(\@read,"backward");
201							# For 8-bit data we need to emulate a signed/unsigned
202							# cast that is implicit in the C implementations.....
203	44	50				23310	if ($creator->{header}->{sample_size} == 1) {
204	0					0	foreach (@{$transformed_read}) {
	0					0
205	0	0				0	$_ += 256 if ($_ < 0);
206							}
207							}
208	44					71	$current_read_position += $length;
209	44					77	$creator->{'traces'}->{$_} = join(' ',@{$transformed_read});
	44					59013
210							}
211
212							# now go and get the peak index information
213	11					46	$offset = $creator->{header}->{bases_offset};
214	11					36	$length = ($creator->{header}->{bases} * 4);
215	11					89	$buffer = $self->read_from_buffer($fh,$buffer,$length,$offset);
216	11					51	$creator->{peak_indices} = $self->_get_v3_peak_indices($buffer);
217	11					25	$offset += $length;
218							# now go and get the accuracy information
219	11					34	$buffer = $self->read_from_buffer($fh,$buffer,$length,$offset);
220	11					39	$creator->{accuracies} = $self->_get_v3_base_accuracies($buffer);
221							# OK, now go and get the base information.
222	11					26	$offset += $length;
223	11					18	$length = $creator->{header}->{bases};
224	11					28	$buffer = $self->read_from_buffer($fh,$buffer,$length,$offset);
225	11					52	$creator->{'sequence'} = unpack("a$length",$buffer);
226							# now, finally, extract the calls from the accuracy information.
227							$creator->{qualities} = $self->_get_v3_quality(
228	11					47	$creator->{'sequence'},$creator->{accuracies});
229							}
230							# now go and get the comment information
231	15					62	$offset = $creator->{header}->{comments_offset};
232	15					109	seek $fh,$offset,0;
233	15					32	$length = $creator->{header}->{comment_size};
234	15					85	$buffer = $self->read_from_buffer($fh,$buffer,$length);
235	15					63	$creator->{comments} = $self->_get_comments($buffer);
236	74					91	my @name_comments = grep {$_->tagname() eq 'NAME'}
237	15					69	$creator->{comments}->get_Annotations('comment');
238	15					24	my $name_comment;
239	15	100				39	if (@name_comments){
240	7					20	$name_comment = $name_comments[0]->as_text();
241	7					35	$name_comment =~ s/^Comment:\s+//;
242							}
243
244							my $swq = Bio::Seq::Quality->new(
245							-seq => $creator->{'sequence'},
246	15					151	-qual => $creator->{'qualities'},
247							-id => $name_comment
248							);
249							my $returner = Bio::Seq::SequenceTrace->new(
250							-swq => $swq,
251							-trace_a => $creator->{'traces'}->{'a'},
252							-trace_t => $creator->{'traces'}->{'t'},
253							-trace_g => $creator->{'traces'}->{'g'},
254							-trace_c => $creator->{'traces'}->{'c'},
255							-accuracy_a => $creator->{'accuracies'}->{'a'},
256							-accuracy_t => $creator->{'accuracies'}->{'t'},
257							-accuracy_g => $creator->{'accuracies'}->{'g'},
258							-accuracy_c => $creator->{'accuracies'}->{'c'},
259	15					297	-peak_indices => $creator->{'peak_indices'}
260							);
261
262	15					94	$returner->annotation($creator->{'comments'}); # add SCF comments
263	15					31	$self->{'_readfile'} = 1;
264	15					2668	return $returner;
265							}
266
267
268							=head2 _get_v3_quality()
269
270							Title : _get_v3_quality()
271							Usage : $self->_get_v3_quality()
272							Function: Set the base qualities from version3 scf
273							Returns : Nothing. Alters $self.
274							Args : None.
275							Notes :
276
277							=cut
278
279							#'
280							sub _get_v3_quality {
281	11			11		29	my ($self,$sequence,$accuracies) = @_;
282	11					661	my @bases = split//,$sequence;
283	11					11	my (@qualities,$currbase,$currqual,$counter);
284	11					47	for ($counter=0; $counter <= $#bases ; $counter++) {
285	7639					5388	$currbase = lc($bases[$counter]);
286	7639	100				9714	if ($currbase eq "a") { $currqual = $accuracies->{'a'}->[$counter]; }
	1733	100				1375
		100
		50
287	2691					1970	elsif ($currbase eq "c") { $currqual = $accuracies->{'c'}->[$counter]; }
288	1227					970	elsif ($currbase eq "g") { $currqual = $accuracies->{'g'}->[$counter]; }
289	1988					1463	elsif ($currbase eq "t") { $currqual = $accuracies->{'t'}->[$counter]; }
290	0					0	else { $currqual = "unknown"; }
291	7639					9320	push @qualities,$currqual;
292							}
293	11					6432	return \@qualities;
294							}
295
296							=head2 _get_v3_peak_indices($buffer)
297
298							Title : _get_v3_peak_indices($buffer)
299							Usage : $self->_get_v3_peak_indices($buffer);
300							Function: Unpacks the base accuracies for version3 scf
301							Returns : Nothing. Alters $self
302							Args : A scalar containing binary data.
303							Notes :
304
305							=cut
306
307							sub _get_v3_peak_indices {
308	11			11		26	my ($self,$buffer) = @_;
309	11					20	my $length = length($buffer);
310	11					568	my @read = unpack "N$length",$buffer;
311	11					1414	return join(' ',@read);
312							}
313
314							=head2 _get_v3_base_accuracies($buffer)
315
316							Title : _get_v3_base_accuracies($buffer)
317							Usage : $self->_get_v3_base_accuracies($buffer)
318							Function: Set the base accuracies for version 3 scf's
319							Returns : Nothing. Alters $self.
320							Args : A scalar containing binary data.
321							Notes :
322
323							=cut
324
325							#'
326							sub _get_v3_base_accuracies {
327	11			11		16	my ($self,$buffer) = @_;
328	11					22	my $length = length($buffer);
329	11					24	my $qlength = $length/4;
330	11					22	my $offset = 0;
331	11					10	my (@qualities,@sorter,$counter,$round,$last_base,$accuracies,$currbase);
332	11					28	foreach $currbase (qw(a c g t)) {
333	44					31	my @read;
334	44					54	$last_base = $offset + $qlength;
335	44					68	for (;$offset < $last_base; $offset += $qlength) {
336							# a bioperler (perhaps me?) changed the unpack string to include 'n' rather than 'C'
337							# on 040322 I think that 'C' is correct. please email chad if you would like to accuse me of being incorrect
338	44					1529	@read = unpack "C$qlength", substr($buffer,$offset,$qlength);
339	44					616	$accuracies->{$currbase} = \@read;
340							}
341							}
342	11					41	return $accuracies;
343							}
344
345
346							=head2 _get_comments($buffer)
347
348							Title : _get_comments($buffer)
349							Usage : $self->_get_comments($buffer);
350							Function: Gather the comments section from the scf and parse it into its
351							components.
352							Returns : a Bio::Annotation::Collection object
353							Args : The buffer. It is expected that the buffer contains a binary
354							string for the comments section of an scf file according to
355							the scf file specifications.
356							Notes :
357
358							=cut
359
360							sub _get_comments {
361	15			15		59	my ($self,$buffer) = @_;
362	15					254	my $comments = Bio::Annotation::Collection->new();
363	15					33	my $size = length($buffer);
364	15					78	my $comments_retrieved = unpack "a$size",$buffer;
365	15					134	$comments_retrieved =~ s/\0//;
366	15					98	my @comments_split = split/\n/,$comments_retrieved;
367	15	100				41	if (@comments_split) {
368	13					56	foreach (@comments_split) {
369	100					394	/(\w+)=(.*)/;
370	100	100	33			395	if ($1 && $2) {
371	74					113	my ($tagname, $text) = ($1, $2);
372	74					305	my $comment_obj = Bio::Annotation::Comment->new(
373							-text => $text,
374							-tagname => $tagname);
375
376	74					176	$comments->add_Annotation('comment', $comment_obj);
377							}
378							}
379							}
380	15					36	$self->{'comments'} = $comments;
381	15					48	return $comments;
382							}
383
384							=head2 _get_header()
385
386							Title : _get_header($buffer)
387							Usage : $self->_get_header($buffer);
388							Function: Gather the header section from the scf and parse it into its
389							components.
390							Returns : Reference to a hash containing the header components.
391							Args : The buffer. It is expected that the buffer contains a binary
392							string for the header section of an scf file according to the
393							scf file specifications.
394							Notes : None.
395
396							=cut
397
398							sub _get_header {
399	15			15		20	my ($self,$buffer) = @_;
400	15					19	my $header;
401							($header->{'scf'},
402							$header->{'samples'},
403							$header->{'sample_offset'},
404							$header->{'bases'},
405							$header->{'bases_left_clip'},
406							$header->{'bases_right_clip'},
407							$header->{'bases_offset'},
408							$header->{'comment_size'},
409							$header->{'comments_offset'},
410							$header->{'version'},
411							$header->{'sample_size'},
412							$header->{'code_set'},
413	15					194	@{$header->{'header_spare'}} ) = unpack "a4 NNNNNNNN a4 NN N20", $buffer;
	15					82
414
415	15					49	$self->{'header'} = $header;
416	15					29	return $header;
417							}
418
419							=head2 _parse_v2_bases($buffer)
420
421							Title : _parse_v2_bases($buffer)
422							Usage : $self->_parse_v2_bases($buffer);
423							Function: Gather the bases section from the scf and parse it into its
424							components.
425							Returns :
426							Args : The buffer. It is expected that the buffer contains a binary
427							string for the bases section of an scf file according to the
428							scf file specifications.
429							Notes : None.
430
431							=cut
432
433							sub _parse_v2_bases {
434	4			4		8	my ($self,$buffer) = @_;
435	4					7	my $length = length($buffer);
436	4					8	my ($offset2,$currbuff,$currbase,$currqual,$sequence,@qualities,@indices);
437	0					0	my (@read,$harvester,$accuracies);
438	4					16	for ($offset2=0;$offset2<$length;$offset2+=12) {
439	3734					10833	@read = unpack "N C C C C a C3", substr($buffer,$offset2,$length);
440	3734					3250	push @indices,$read[0];
441	3734					2610	$currbase = lc($read[5]);
442	3734	100				5157	if ($currbase eq "a") { $currqual = $read[1]; }
	828	100				581
		100
		50
443	1238					867	elsif ($currbase eq "c") { $currqual = $read[2]; }
444	710					490	elsif ($currbase eq "g") { $currqual = $read[3]; }
445	958					662	elsif ($currbase eq "t") { $currqual = $read[4]; }
446	0					0	else { $currqual = "UNKNOWN"; }
447	3734					2249	push @{$accuracies->{"a"}},$read[1];
	3734					3271
448	3734					2213	push @{$accuracies->{"c"}},$read[2];
	3734					2916
449	3734					2118	push @{$accuracies->{"g"}},$read[3];
	3734					2817
450	3734					2117	push @{$accuracies->{"t"}},$read[4];
	3734					2747
451
452	3734					2486	$sequence .= $currbase;
453	3734					5116	push @qualities,$currqual;
454							}
455	4					56	return (\@indices,\@qualities,$sequence,$accuracies)
456							}
457
458							=head2 _parse_v2_traces(\@traces_array)
459
460							Title : _pares_v2_traces(\@traces_array)
461							Usage : $self->_parse_v2_traces(\@traces_array);
462							Function: Parses an scf Version2 trace array into its base components.
463							Returns : Nothing. Modifies $self.
464							Args : A reference to an array of the unpacked traces section of an
465							scf version2 file.
466
467							=cut
468
469							sub _parse_v2_traces {
470	4			4		7	my ($self,$buffer,$sample_size) = @_;
471	4					5	my $byte;
472	4	50				9	if ($sample_size == 1) { $byte = "c"; }
	0					0
473	4					8	else { $byte = "n"; }
474	4					7	my $length = CORE::length($buffer);
475	4					15497	my @read = unpack "${byte}${length}",$buffer;
476							# this will be an array to the reference holding the array
477	4					3363	my $traces;
478	4					11	my $array = 0;
479	4					53	for (my $offset2 = 0; $offset2< scalar(@read); $offset2+=4) {
480	46000					25935	push @{$traces->{'a'}},$read[$offset2];
	46000					38324
481	46000					26567	push @{$traces->{'c'}},$read[$offset2+1];
	46000					38220
482	46000					24949	push @{$traces->{'g'}},$read[$offset2+3];
	46000					37541
483	46000					26236	push @{$traces->{'t'}},$read[$offset2+2];
	46000					69101
484							}
485	4					3505	return $traces;
486							}
487
488
489				0	0		sub get_trace_deprecated_use_the_sequencetrace_object_instead {
490							# my ($self,$base_channel,$traces) = @_;
491							# $base_channel =~ tr/a-z/A-Z/;
492							# if ($base_channel !~ /A\|T\|G\|C/) {
493							# $self->throw("You tried to ask for a base channel that wasn't A,T,G, or C. Ask for one of those next time.");
494							##} elsif ($base_channel) {
495							# my @temp = split(' ',$self->{'traces'}->{$base_channel});
496							#return \@temp;
497							#}
498							}
499
500							sub _deprecated_get_peak_indices_deprecated_use_the_sequencetrace_object_instead {
501	0			0		0	my ($self) = shift;
502	0					0	my @temp = split(' ',$self->{'parsed'}->{'peak_indices'});
503	0					0	return \@temp;
504							}
505
506
507							=head2 get_header()
508
509							Title : get_header()
510							Usage : %header = %{$obj->get_header()};
511							Function: Return the header for this scf.
512							Returns : A reference to a hash containing the header for this scf.
513							Args : None.
514							Notes :
515
516							=cut
517
518							sub get_header {
519	1			1	1	587	my ($self) = shift;
520	1					14	return $self->{'header'};
521							}
522
523							=head2 get_comments()
524
525							Title : get_comments()
526							Usage : %comments = %{$obj->get_comments()};
527							Function: Return the comments for this scf.
528							Returns : A Bio::Annotation::Collection object
529							Args : None.
530							Notes :
531
532							=cut
533
534							sub get_comments {
535	1			1	1	3	my ($self) = shift;
536	1					3	return $self->{'comments'};
537							}
538
539							sub _dump_traces_outgoing_deprecated_use_the_sequencetrace_object {
540	0			0		0	my ($self,$transformed) = @_;
541	0					0	my (@sA,@sT,@sG,@sC);
542	0	0				0	if ($transformed) {
543	0					0	@sA = @{$self->{'text'}->{'t_samples_a'}};
	0					0
544	0					0	@sC = @{$self->{'text'}->{'t_samples_c'}};
	0					0
545	0					0	@sG = @{$self->{'text'}->{'t_samples_g'}};
	0					0
546	0					0	@sT = @{$self->{'text'}->{'t_samples_t'}};
	0					0
547							}
548							else {
549	0					0	@sA = @{$self->{'text'}->{'samples_a'}};
	0					0
550	0					0	@sC = @{$self->{'text'}->{'samples_c'}};
	0					0
551	0					0	@sG = @{$self->{'text'}->{'samples_g'}};
	0					0
552	0					0	@sT = @{$self->{'text'}->{'samples_t'}};
	0					0
553							}
554	0					0	print ("Count\ta\tc\tg\tt\n");
555	0					0	for (my $curr=0; $curr < scalar(@sG); $curr++) {
556	0					0	print("$curr\t$sA[$curr]\t$sC[$curr]\t$sG[$curr]\t$sT[$curr]\n");
557							}
558	0					0	return;
559							}
560
561				0			sub _dump_traces_incoming_deprecated_use_the_sequencetrace_object {
562							# my ($self) = @_;
563							# my (@sA,@sT,@sG,@sC);
564							# @sA = @{$self->{'traces'}->{'A'}};
565							# @sC = @{$self->{'traces'}->{'C'}};
566							# @sG = @{$self->{'traces'}->{'G'}};
567							# @sT = @{$self->{'traces'}->{'T'}};
568							# @sA = @{$self->get_trace('A')};
569							# @sC = @{$self->get_trace('C')};
570							# @sG = @{$self->get_trace('G')};
571							# @sT = @{$self->get_trace('t')};
572							# print ("Count\ta\tc\tg\tt\n");
573							# for (my $curr=0; $curr < scalar(@sG); $curr++) {
574							# print("$curr\t$sA[$curr]\t$sC[$curr]\t$sG[$curr]\t$sT[$curr]\n");
575							#}
576							#return;
577							}
578
579							=head2 write_seq
580
581							Title : write_seq(-target => $swq, )
582							Usage : $obj->write_seq(
583							-target => $swq,
584							-version => 2,
585							-CONV => "Bioperl-Chads Mighty SCF writer.");
586							Function: Write out an scf.
587							Returns : Nothing.
588							Args : Requires: a reference to a Bio::Seq::Quality object to form the
589							basis for the scf.
590							if -version is provided, it should be "2" or "3". A SCF of that
591							version will be written.
592							Any other arguments are assumed to be comments and are put into
593							the comments section of the scf. Read the specifications for scf
594							to decide what might be good to put in here.
595
596							Notes :
597							For best results, use a SequenceTrace object.
598							The things that you need to write an scf:
599							a) sequence
600							b) quality
601							c) peak indices
602							d) traces
603							- You _can_ write an scf with just a and b by passing in a
604							Bio::Seq::Quality object- false traces will be synthesized
605							for you.
606
607							=cut
608
609							sub write_seq {
610	10			10	1	3525	my ($self,%args) = @_;
611	10					35	my %comments;
612	10					11	my ($label,$arg);
613	10					64	my ($swq) = $self->_rearrange([qw(TARGET)], %args);
614	10					21	my $writer_fodder;
615	10	50				88	if (ref($swq) =~ /Bio::Seq::SequenceTrace\|Bio::Seq::Quality/) {
616	10	100				29	if (ref($swq) eq "Bio::Seq::Quality") {
617							# this means that the object has no trace data
618							# we might as well synthesize some now, ok?
619	2					15	$swq = Bio::Seq::SequenceTrace->new(
620							-swq => $swq
621							);
622							}
623							}
624							else {
625	0					0	$self->throw("You must pass a Bio::Seq::Quality or a Bio::Seq::SequenceTrace object to write_seq as a parameter named \"target\"");
626							}
627							# all of the rest of the arguments are comments for the scf
628	10					50	foreach $arg (sort keys %args) {
629	23	100				69	next if ($arg =~ /target/i);
630	13					25	($label = $arg) =~ s/^\-//;
631	13					23	$writer_fodder->{comments}->{$label} = $args{$arg};
632							}
633	10	50				38	if (!$comments{'NAME'}) { $comments{'NAME'} = $swq->id(); }
	10					35
634							# HA! Bwahahahaha.
635	10	50				47	$writer_fodder->{comments}->{'CONV'} = "Bioperl-Chads Mighty SCF writer." unless defined $comments{'CONV'};
636							# now deal with the version of scf they want to write
637	10	100				24	if ($writer_fodder->{comments}->{version}) {
638	1	50	33			9	if ($writer_fodder->{comments}->{version} != 2 && $writer_fodder->{comments}->{version} != 3) {
		50
639	0					0	$self->warn("This module can only write version 2.0 or 3.0 scf's. Writing a version 2.0 scf by default.");
640	0					0	$writer_fodder->{header}->{version} = "2.00";
641							}
642							elsif ($writer_fodder->{comments}->{'version'} > 2) {
643	0					0	$writer_fodder->{header}->{'version'} = "3.00";
644							}
645							else {
646	1					3	$writer_fodder->{header}->{version} = "2";
647							}
648							}
649							else {
650	9					25	$writer_fodder->{header}->{'version'} = "3.00";
651							}
652							# set a few things in the header
653	10					20	$writer_fodder->{'header'}->{'magic'} = ".scf";
654	10					19	$writer_fodder->{'header'}->{'sample_size'} = "2";
655	10					30	$writer_fodder->{'header'}->{'bases'} = length($swq->seq());
656	10					20	$writer_fodder->{'header'}->{'bases_left_clip'} = "0";
657	10					23	$writer_fodder->{'header'}->{'bases_right_clip'} = "0";
658	10					20	$writer_fodder->{'header'}->{'sample_size'} = "2";
659	10					17	$writer_fodder->{'header'}->{'code_set'} = "9";
660	10					20	@{$writer_fodder->{'header'}->{'spare'}} = qw(0 0 0 0 0 0 0 0 0 0
	10					82
661							0 0 0 0 0 0 0 0 0 0);
662	10					20	$writer_fodder->{'header'}->{'samples_offset'} = "128";
663	10					34	$writer_fodder->{'header'}->{'samples'} = $swq->trace_length();
664							# create the binary for the comments and file it in writer_fodder
665							$writer_fodder->{comments} = $self->_get_binary_comments(
666	10					40	$writer_fodder->{comments});
667							# create the binary and the strings for the traces, bases,
668							# offsets (if necessary), and accuracies (if necessary)
669							$writer_fodder->{traces} = $self->_get_binary_traces(
670							$writer_fodder->{'header'}->{'version'},
671	10					54	$swq,$writer_fodder->{'header'}->{'sample_size'});
672	10					24	my ($b_base_offsets,$b_base_accuracies,$samples_size,$bases_size);
673							#
674							# version 2
675							#
676	10	100				78	if ($writer_fodder->{'header'}->{'version'} == 2) {
677							$writer_fodder->{bases} = $self->_get_binary_bases(
678							2,
679							$swq,
680	1					9	$writer_fodder->{'header'}->{'sample_size'});
681	1					4	$samples_size = CORE::length($writer_fodder->{traces}->{'binary'});
682	1					3	$bases_size = CORE::length($writer_fodder->{bases}->{binary});
683	1					7	$writer_fodder->{'header'}->{'bases_offset'} = 128 + $samples_size;
684	1					4	$writer_fodder->{'header'}->{'comments_offset'} = 128 +
685							$samples_size + $bases_size;
686							$writer_fodder->{'header'}->{'comments_size'} =
687	1					4	length($writer_fodder->{'comments'}->{binary});
688	1					4	$writer_fodder->{'header'}->{'private_size'} = "0";
689							$writer_fodder->{'header'}->{'private_offset'} = 128 +
690							$samples_size + $bases_size +
691	1					6	$writer_fodder->{'header'}->{'comments_size'};
692							$writer_fodder->{'header'}->{'binary'} =
693	1					6	$self->_get_binary_header($writer_fodder->{header});
694	1	50				8	$dumper->dumpValue($writer_fodder) if $self->verbose > 0;
695	1	50				10	$self->_print ($writer_fodder->{'header'}->{'binary'})
696							or print("Could not write binary header...\n");
697	1	50				4	$self->_print ($writer_fodder->{'traces'}->{'binary'})
698							or print("Could not write binary traces...\n");
699	1	50				6	$self->_print ($writer_fodder->{'bases'}->{'binary'})
700							or print("Could not write binary base structures...\n");
701	1	50				5	$self->_print ($writer_fodder->{'comments'}->{'binary'})
702							or print("Could not write binary comments...\n");
703							}
704							else {
705							($writer_fodder->{peak_indices},
706							$writer_fodder->{accuracies},
707							$writer_fodder->{bases},
708							$writer_fodder->{reserved} ) =
709							$self->_get_binary_bases(
710							3,
711							$swq,
712	9					64	$writer_fodder->{'header'}->{'sample_size'}
713							);
714							$writer_fodder->{'header'}->{'bases_offset'} = 128 +
715	9					32	length($writer_fodder->{'traces'}->{'binary'});
716							$writer_fodder->{'header'}->{'comments_size'} =
717	9					31	length($writer_fodder->{'comments'}->{'binary'});
718							# this is:
719							# bases_offset + base_offsets + accuracies + called_bases +
720							# reserved
721	9					28	$writer_fodder->{'header'}->{'private_size'} = "0";
722
723							$writer_fodder->{'header'}->{'comments_offset'} =
724							128+length($writer_fodder->{'traces'}->{'binary'})+
725							length($writer_fodder->{'peak_indices'}->{'binary'})+
726							length($writer_fodder->{'accuracies'}->{'binary'})+
727							length($writer_fodder->{'bases'}->{'binary'})+
728	9					46	length($writer_fodder->{'reserved'}->{'binary'});
729							$writer_fodder->{'header'}->{'private_offset'} =
730							$writer_fodder->{'header'}->{'comments_offset'} +
731	9					20	$writer_fodder->{'header'}->{'comments_size'};
732							$writer_fodder->{'header'}->{'spare'}->[1] =
733							$writer_fodder->{'header'}->{'comments_offset'} +
734	9					23	length($writer_fodder->{'comments'}->{'binary'});
735							$writer_fodder->{header}->{binary} =
736	9					35	$self->_get_binary_header($writer_fodder->{header});
737	9	50				93	$self->_print ($writer_fodder->{'header'}->{'binary'})
738							or print("Couldn't write header\n");
739	9	50				32	$self->_print ($writer_fodder->{'traces'}->{'binary'})
740							or print("Couldn't write samples\n");
741	9	50				41	$self->_print ($writer_fodder->{'peak_indices'}->{'binary'})
742							or print("Couldn't write peak offsets\n");
743	9	50				35	$self->_print ($writer_fodder->{'accuracies'}->{'binary'})
744							or print("Couldn't write accuracies\n");
745	9	50				31	$self->_print ($writer_fodder->{'bases'}->{'binary'})
746							or print("Couldn't write called_bases\n");
747	9	50				30	$self->_print ($writer_fodder->{'reserved'}->{'binary'})
748							or print("Couldn't write reserved\n");
749	9	50				26	$self->_print ($writer_fodder->{'comments'}->{'binary'})
750							or print ("Couldn't write comments\n");
751							}
752
753							# kinda unnecessary, given the close() below, but maybe that'll go
754							# away someday.
755	10	50	33			48	$self->flush if $self->_flush_on_write && defined $self->_fh;
756
757	10					42	$self->close();
758	10					5564	return 1;
759							}
760
761
762
763
764
765							=head2 _get_binary_header()
766
767							Title : _get_binary_header();
768							Usage : $self->_get_binary_header();
769							Function: Provide the binary string that will be used as the header for
770							a scfv2 document.
771							Returns : A binary string.
772							Args : None. Uses the entries in the $self->{'header'} hash. These
773							are set on construction of the object (hopefully correctly!).
774							Notes :
775
776							=cut
777
778							sub _get_binary_header {
779	10			10		19	my ($self,$header) = @_;
780							my $binary = pack "a4 NNNNNNNN a4 NN N20",
781							(
782							$header->{'magic'},
783							$header->{'samples'},
784							$header->{'samples_offset'},
785							$header->{'bases'},
786							$header->{'bases_left_clip'},
787							$header->{'bases_right_clip'},
788							$header->{'bases_offset'},
789							$header->{'comments_size'},
790							$header->{'comments_offset'},
791							$header->{'version'},
792							$header->{'sample_size'},
793							$header->{'code_set'},
794	10					48	@{$header->{'spare'}}
	10					106
795							);
796	10					39	return $binary;
797							}
798
799							=head2 _get_binary_traces($version,$ref)
800
801							Title : _set_binary_tracesbases($version,$ref)
802							Usage : $self->_set_binary_tracesbases($version,$ref);
803							Function: Constructs the trace and base strings for all scfs
804							Returns : Nothing. Alters self.
805							Args : $version - "2" or "3"
806							$sequence - a scalar containing arbitrary sequence data
807							$ref - a reference to either a SequenceTraces or a
808							SequenceWithQuality object.
809							Notes : This is a really complicated thing.
810
811							=cut
812
813							sub _get_binary_traces {
814	10			10		19	my ($self,$version,$ref,$sample_size) = @_;
815							# ref _should_ be a Bio::Seq::SequenceTrace, but might be a
816							# Bio::Seq::Quality
817	10					10	my $returner;
818	10					19	my $sequence = $ref->seq();
819	10					18	my $sequence_length = length($sequence);
820							# first of all, do we need to synthesize the trace?
821							# if so, call synthesize_base
822	10					11	my ($traceobj,@traces,$current);
823	10	50				34	if ( ref($ref) eq "Bio::Seq::Quality" ) {
824	0					0	$traceobj = Bio::Seq::Quality->new(
825							-target => $ref
826							);
827	0					0	$traceobj->_synthesize_traces();
828							}
829							else {
830	10					14	$traceobj = $ref;
831	10	100				66	if ($version eq "2") {
		50
832	1					4	my $trace_length = $traceobj->trace_length();
833	1					4	for ($current = 1; $current <= $trace_length; $current++) {
834	14107					13802	foreach (qw(a c g t)) {
835	56428					76867	push @traces,$traceobj->trace_value_at($_,$current);
836							}
837							}
838							}
839							elsif ($version == 3) {
840	9					24	foreach my $current_trace (qw(a c g t)) {
841	36					54	my @trace = @{$traceobj->trace($current_trace)};
	36					254
842	36					123	foreach (@trace) {
843	245300	50				278375	if ($_ > 30000) {
844	0					0	$_ -= 65536;
845							}
846							}
847	36					285	my $transformed = $self->_delta(\@trace,"forward");
848	36	50				135	if($sample_size == 1){
849	0					0	foreach (@{$transformed}) {
	0					0
850	0	0				0	$_ += 256 if ($_ < 0);
851							}
852							}
853	36					57	push @traces,@{$transformed};
	36					36985
854							}
855							}
856							}
857	10					80	$returner->{version} = $version;
858	10					30	$returner->{string} = \@traces;
859	10					19	my $length_of_traces = scalar(@traces);
860	10					19	my $byte;
861	10	50				34	if ($sample_size == 1) { $byte = "c"; } else { $byte = "n"; }
	0					0
	10					17
862							# an unsigned integer should be I, but this is too long
863							#
864	10					5842	$returner->{binary} = pack "n${length_of_traces}",@traces;
865	10					36	$returner->{length} = CORE::length($returner->{binary});
866	10					60	return $returner;
867							}
868
869
870							sub _get_binary_bases {
871	10			10		25	my ($self,$version,$trace,$sample_size) = @_;
872	10					12	my $byte;
873	10	50				31	if ($sample_size == 1) { $byte = "c"; } else { $byte = "n"; }
	0					0
	10					18
874	10					15	my ($returner,@current_row,$current_base,$string,$binary);
875	10					53	my $length = $trace->length();
876	10	100				23	if ($version == 2) {
877	1					3	$returner->{'version'} = "2";
878	1					7	for (my $current_base =1; $current_base <= $length; $current_base++) {
879	1106					737	my @current_row;
880	1106					1414	push @current_row,$trace->peak_index_at($current_base);
881	1106					1495	push @current_row,$trace->accuracy_at("a",$current_base);
882	1106					1339	push @current_row,$trace->accuracy_at("c",$current_base);
883	1106					1337	push @current_row,$trace->accuracy_at("g",$current_base);
884	1106					1365	push @current_row,$trace->accuracy_at("t",$current_base);
885	1106					1293	push @current_row,$trace->baseat($current_base);
886	1106					934	push @current_row,0,0,0;
887	1106					615	push @{$returner->{string}},@current_row;
	1106					1857
888	1106					3200	$returner->{binary} .= pack "N C C C C a C3",@current_row;
889							}
890	1					8	return $returner;
891							}
892							else {
893	9					30	$returner->{'version'} = "3.00";
894	9					35	$returner->{peak_indices}->{string} = $trace->peak_indices();
895	9					16	my $length = scalar(@{$returner->{peak_indices}->{string}});
	9					20
896							$returner->{peak_indices}->{binary} =
897	9					24	pack "N$length",@{$returner->{peak_indices}->{string}};
	9					348
898							$returner->{peak_indices}->{length} =
899	9					18	CORE::length($returner->{peak_indices}->{binary});
900	9					15	my @accuracies;
901	9					28	foreach my $base (qw(a c g t)) {
902	36					73	$returner->{accuracies}->{$base} = $trace->accuracies($base);
903	36					47	push @accuracies,@{$trace->accuracies($base)};
	36					49
904							}
905	9					34	$returner->{sequence} = $trace->seq();
906	9					16	$length = scalar(@accuracies);
907							# this really is "c" for samplesize == 2
908	9					352	$returner->{accuracies}->{binary} = pack "C${length}",@accuracies;
909							$returner->{accuracies}->{length} =
910	9					21	CORE::length($returner->{accuracies}->{binary});
911	9					28	$length = $trace->seq_obj()->length();
912	9					39	for (my $count=0; $count< $length; $count++) {
913	4629					2396	push @{$returner->{reserved}->{string}},0,0,0;
	4629					7248
914							}
915							}
916	9					19	$length = scalar(@{$returner->{reserved}->{string}});
	9					28
917							# this _must_ be "c"
918							$returner->{'reserved'}->{'binary'} =
919	9					25	pack "c$length",@{$returner->{reserved}->{string}};
	9					274
920							$returner->{'reserved'}->{'length'} =
921	9					29	CORE::length($returner->{'reserved'}->{'binary'});
922							# $returner->{'bases'}->{'string'} = $trace->seq();
923	9					115	my @bases = split('',$trace->seq());
924	9					31	$length = $trace->length();
925	9					24	$returner->{'bases'}->{'binary'} = $trace->seq();
926							# print("Returning this:\n");
927							# $dumper->dumpValue($returner);
928							return ($returner->{peak_indices},
929							$returner->{accuracies},
930							$returner->{bases},
931	9					253	$returner->{reserved});
932
933							}
934
935
936							=head2 _make_trace_string($version)
937
938							Title : _make_trace_string($version)
939							Usage : $self->_make_trace_string($version)
940							Function: Merges trace data for the four bases to produce an scf
941							trace string. _requires_ $version
942							Returns : Nothing. Alters $self.
943							Args : $version - a version number. "2" or "3"
944							Notes :
945
946							=cut
947
948							sub _make_trace_string {
949	0			0		0	my ($self,$version) = @_;
950	0					0	my @traces;
951							my @traces_view;
952	0					0	my @as = @{$self->{'text'}->{'samples_a'}};
	0					0
953	0					0	my @cs = @{$self->{'text'}->{'samples_c'}};
	0					0
954	0					0	my @gs = @{$self->{'text'}->{'samples_g'}};
	0					0
955	0					0	my @ts = @{$self->{'text'}->{'samples_t'}};
	0					0
956	0	0				0	if ($version == 2) {
		0
957	0					0	for (my $curr=0; $curr < scalar(@as); $curr++) {
958	0	0				0	$as[$curr] = $DEFAULT_QUALITY unless defined $as[$curr];
959	0	0				0	$cs[$curr] = $DEFAULT_QUALITY unless defined $cs[$curr];
960	0	0				0	$gs[$curr] = $DEFAULT_QUALITY unless defined $gs[$curr];
961	0	0				0	$ts[$curr] = $DEFAULT_QUALITY unless defined $ts[$curr];
962	0					0	push @traces,($as[$curr],$cs[$curr],$gs[$curr],$ts[$curr]);
963							}
964							}
965							elsif ($version == 3) {
966	0					0	@traces = (@as,@cs,@gs,@ts);
967							}
968							else {
969	0					0	$self->throw("No idea what version required to make traces here. You gave #$version# Bailing.");
970							}
971	0					0	my $length = scalar(@traces);
972	0					0	$self->{'text'}->{'samples_all'} = \@traces;
973
974							}
975
976							=head2 _get_binary_comments(\@comments)
977
978							Title : _get_binary_comments(\@comments)
979							Usage : $self->_get_binary_comments(\@comments);
980							Function: Provide a binary string that will be the comments section of
981							the scf file. See the scf specifications for detailed
982							specifications for the comments section of an scf file. Hint:
983							CODE=something\nBODE=something\n\0
984							Returns :
985							Args : A reference to an array containing comments.
986							Notes : None.
987
988							=cut
989
990							sub _get_binary_comments {
991	10			10		18	my ($self,$rcomments) = @_;
992	10					10	my $returner;
993	10					14	my $comments_string = '';
994	10					45	my %comments = %$rcomments;
995	10					33	foreach my $key (sort keys %comments) {
996	21		50			39	$comments{$key} \|\|= '';
997	21					45	$comments_string .= "$key=$comments{$key}\n";
998							}
999	10					17	$comments_string .= "\n\0";
1000	10					16	my $length = CORE::length($comments_string);
1001	10					24	$returner->{length} = $length;
1002	10					23	$returner->{string} = $comments_string;
1003	10					75	$returner->{binary} = pack "A$length",$comments_string;
1004	10					26	return $returner;
1005							}
1006
1007							#=head2 _fill_missing_data($swq)
1008							#
1009							# Title : _fill_missing_data($swq)
1010							# Usage : $self->_fill_missing_data($swq);
1011							# Function: If the $swq with quality has no qualities, set all qualities
1012							# to 0.
1013							# If the $swq has no sequence, set the sequence to N's.
1014							# Returns : Nothing. Modifies the Bio::Seq::Quality that was passed as an
1015							# argument.
1016							# Args : A reference to a Bio::Seq::Quality
1017							# Notes : None.
1018							#
1019							#=cut
1020							#
1021							##'
1022							#sub _fill_missing_data {
1023							# my ($self,$swq) = @_;
1024							# my $qual_obj = $swq->qual_obj();
1025							# my $seq_obj = $swq->seq_obj();
1026							# if ($qual_obj->length() == 0 && $seq_obj->length() != 0) {
1027							# my $fake_qualities = ("$DEFAULT_QUALITY ")x$seq_obj->length();
1028							# $swq->qual($fake_qualities);
1029							# }
1030							# if ($seq_obj->length() == 0 && $qual_obj->length != 0) {
1031							# my $sequence = ("N")x$qual_obj->length();
1032							# $swq->seq($sequence);
1033							# }
1034							#}
1035
1036							=head2 _delta(\@trace_data,$direction)
1037
1038							Title : _delta(\@trace_data,$direction)
1039							Usage : $self->_delta(\@trace_data,$direction);
1040							Function:
1041							Returns : A reference to an array containing modified trace values.
1042							Args : A reference to an array containing trace data and a string
1043							indicating the direction of conversion. ("forward" or
1044							"backward").
1045							Notes : This code is taken from the specification for SCF3.2.
1046							http://www.mrc-lmb.cam.ac.uk/pubseq/manual/formats_unix_4.html
1047
1048							=cut
1049
1050
1051							sub _delta {
1052	80			80		344	my ($self,$rsamples,$direction) = @_;
1053	80					42508	my @samples = @$rsamples;
1054							# /* If job == DELTA_IT:
1055							# * change a series of sample points to a series of delta delta values:
1056							# * ie change them in two steps:
1057							# * first: delta = current_value - previous_value
1058							# * then: delta_delta = delta - previous_delta
1059							# * else
1060							# * do the reverse
1061							# */
1062							# int i;
1063							# uint_2 p_delta, p_sample;
1064
1065	80					204	my ($i,$num_samples,$p_delta,$p_sample,@samples_converted,$p_sample1,$p_sample2);
1066	80					116	my $SLOW_BUT_CLEAR = 0;
1067	80					133	$num_samples = scalar(@samples);
1068							# c-programmers are funny people with their single-letter variables
1069
1070	80	100				426	if ( $direction eq "forward" ) {
		50
1071	36	50				68	if($SLOW_BUT_CLEAR){
1072	0					0	$p_delta = 0;
1073	0					0	for ($i=0; $i < $num_samples; $i++) {
1074	0					0	$p_sample = $samples[$i];
1075	0					0	$samples[$i] = $samples[$i] - $p_delta;
1076	0					0	$p_delta = $p_sample;
1077							}
1078	0					0	$p_delta = 0;
1079	0					0	for ($i=0; $i < $num_samples; $i++) {
1080	0					0	$p_sample = $samples[$i];
1081	0					0	$samples[$i] = $samples[$i] - $p_delta;
1082	0					0	$p_delta = $p_sample;
1083							}
1084							} else {
1085	36					146	for ($i = $num_samples-1; $i > 1; $i--){
1086	245228					326998	$samples[$i] = $samples[$i] - 2*$samples[$i-1] + $samples[$i-2];
1087							}
1088	36					86	$samples[1] = $samples[1] - 2*$samples[0];
1089							}
1090							}
1091							elsif ($direction eq "backward") {
1092	44	50				130	if($SLOW_BUT_CLEAR){
1093	0					0	$p_sample = 0;
1094	0					0	for ($i=0; $i < $num_samples; $i++) {
1095	0					0	$samples[$i] = $samples[$i] + $p_sample;
1096	0					0	$p_sample = $samples[$i];
1097							}
1098	0					0	$p_sample = 0;
1099	0					0	for ($i=0; $i < $num_samples; $i++) {
1100	0					0	$samples[$i] = $samples[$i] + $p_sample;
1101	0					0	$p_sample = $samples[$i];
1102							}
1103							} else {
1104	44					126	$p_sample1 = $p_sample2 = 0;
1105	44					232	for ($i = 0; $i < $num_samples; $i++){
1106	424924					260843	$p_sample1 = $p_sample1 + $samples[$i];
1107	424924					255264	$samples[$i] = $p_sample1 + $p_sample2;
1108	424924					472578	$p_sample2 = $samples[$i];
1109							}
1110
1111							}
1112							}
1113							else {
1114	0					0	$self->warn("Bad direction. Use \"forward\" or \"backward\".");
1115							}
1116	80					651	return \@samples;
1117							}
1118
1119							=head2 _unpack_magik($buffer)
1120
1121							Title : _unpack_magik($buffer)
1122							Usage : $self->_unpack_magik($buffer)
1123							Function: What unpack specification should be used? Try them all.
1124							Returns : Nothing.
1125							Args : A buffer containing arbitrary binary data.
1126							Notes : Eliminate the ambiguity and the guesswork. Used in the
1127							adaptation of _delta(), mostly.
1128
1129							=cut
1130
1131							sub _unpack_magik {
1132	0			0		0	my ($self,$buffer) = @_;
1133	0					0	my $length = length($buffer);
1134	0					0	my (@read,$counter);
1135	0					0	foreach (qw(c C s S i I l L n N v V)) {
1136	0					0	@read = unpack "$_$length", $buffer;
1137	0					0	for ($counter=0; $counter < 20; $counter++) {
1138	0					0	print("$read[$counter]\n");
1139							}
1140							}
1141							}
1142
1143							=head2 read_from_buffer($filehandle,$buffer,$length)
1144
1145							Title : read_from_buffer($filehandle,$buffer,$length)
1146							Usage : $self->read_from_buffer($filehandle,$buffer,$length);
1147							Function: Read from the buffer.
1148							Returns : $buffer, containing a read of $length
1149							Args : a filehandle, a buffer, and a read length
1150							Notes : I just got tired of typing
1151							"unless (length($buffer) == $length)" so I put it here.
1152
1153							=cut
1154
1155							sub read_from_buffer {
1156	100			100	1	397	my ($self,$fh,$buffer,$length,$start_position) = @_;
1157							# print("Reading from a buffer!!! length($length) ");
1158	100	100				342	if ($start_position) {
1159							# print(" startposition($start_position)(".sprintf("%X", $start_position).")\n");
1160							}
1161							# print("\n");
1162	100	100				267	if ($start_position) {
1163							# print("seeking to this position in the file: (".$start_position.")\n");
1164	81					549	seek ($fh,$start_position,0);
1165							# print("done. here is where I am now: (".tell($fh).")\n");
1166							}
1167							else {
1168							# print("You did not specify a start position. Going from this position (the current position) (".tell($fh).")\n");
1169							}
1170	100					2435	read $fh, $buffer, $length;
1171	100	50				293	unless (length($buffer) == $length) {
1172	0					0	$self->warn("The read was incomplete! Trying harder.");
1173	0					0	my $missing_length = $length - length($buffer);
1174	0					0	my $buffer2;
1175	0					0	read $fh,$buffer2,$missing_length;
1176	0					0	$buffer .= $buffer2;
1177	0	0				0	if (length($buffer) != $length) {
1178	0					0	$self->throw("Unexpected end of file while reading from SCF file. I should have read $length but instead got ".length($buffer)."! Current file position is ".tell($fh).".");
1179							}
1180							}
1181
1182	100					382	return $buffer;
1183							}
1184
1185							=head2 _dump_keys()
1186
1187							Title : _dump_keys()
1188							Usage : &_dump_keys($a_reference_to_some_hash)
1189							Function: Dump out the keys in a hash.
1190							Returns : Nothing.
1191							Args : A reference to a hash.
1192							Notes : A debugging method.
1193
1194							=cut
1195
1196							sub _dump_keys {
1197	0			0			my $rhash = shift;
1198	0	0					if ($rhash !~ /HASH/) {
1199	0						print("_dump_keys: that was not a hash.\nIt was #$rhash# which was this reference:".ref($rhash)."\n");
1200	0						return;
1201							}
1202	0						print("_dump_keys: The keys for $rhash are:\n");
1203	0						foreach (sort keys %$rhash) {
1204	0						print("$_\n");
1205							}
1206							}
1207
1208							=head2 _dump_base_accuracies()
1209
1210							Title : _dump_base_accuracies()
1211							Usage : $self->_dump_base_accuracies();
1212							Function: Dump out the v3 base accuracies in an easy to read format.
1213							Returns : Nothing.
1214							Args : None.
1215							Notes : A debugging method.
1216
1217							=cut
1218
1219							sub _dump_base_accuracies {
1220	0			0			my $self = shift;
1221	0						print("Dumping base accuracies! for v3\n");
1222	0						print("There are this many elements in a,c,g,t:\n");
1223	0						print(scalar(@{$self->{'text'}->{'v3_base_accuracy_a'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_c'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_g'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_t'}})."\n");
	0
	0
	0
	0
1224	0						my $number_traces = scalar(@{$self->{'text'}->{'v3_base_accuracy_a'}});
	0
1225	0						for (my $counter=0; $counter < $number_traces; $counter++ ) {
1226	0						print("$counter\t");
1227	0						print $self->{'text'}->{'v3_base_accuracy_a'}->[$counter]."\t";
1228	0						print $self->{'text'}->{'v3_base_accuracy_c'}->[$counter]."\t";
1229	0						print $self->{'text'}->{'v3_base_accuracy_g'}->[$counter]."\t";
1230	0						print $self->{'text'}->{'v3_base_accuracy_t'}->[$counter]."\t";
1231	0						print("\n");
1232							}
1233							}
1234
1235							=head2 _dump_peak_indices_incoming()
1236
1237							Title : _dump_peak_indices_incoming()
1238							Usage : $self->_dump_peak_indices_incoming();
1239							Function: Dump out the v3 peak indices in an easy to read format.
1240							Returns : Nothing.
1241							Args : None.
1242							Notes : A debugging method.
1243
1244							=cut
1245
1246							sub _dump_peak_indices_incoming {
1247	0			0			my $self = shift;
1248	0						print("Dump peak indices incoming!\n");
1249	0						my $length = $self->{'bases'};
1250	0						print("The length is $length\n");
1251	0						for (my $count=0; $count < $length; $count++) {
1252	0						print("$count\t$self->{parsed}->{peak_indices}->[$count]\n");
1253							}
1254							}
1255
1256							=head2 _dump_base_accuracies_incoming()
1257
1258							Title : _dump_base_accuracies_incoming()
1259							Usage : $self->_dump_base_accuracies_incoming();
1260							Function: Dump out the v3 base accuracies in an easy to read format.
1261							Returns : Nothing.
1262							Args : None.
1263							Notes : A debugging method.
1264
1265							=cut
1266
1267							sub _dump_base_accuracies_incoming {
1268	0			0			my $self = shift;
1269	0						print("Dumping base accuracies! for v3\n");
1270							# print("There are this many elements in a,c,g,t:\n");
1271							# print(scalar(@{$self->{'parsed'}->{'v3_base_accuracy_a'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_c'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_g'}}).",".scalar(@{$self->{'text'}->{'v3_base_accuracy_t'}})."\n");
1272	0						my $number_traces = $self->{'bases'};
1273	0						for (my $counter=0; $counter < $number_traces; $counter++ ) {
1274	0						print("$counter\t");
1275	0						foreach (qw(A T G C)) {
1276	0						print $self->{'parsed'}->{'base_accuracies'}->{$_}->[$counter]."\t";
1277							}
1278	0						print("\n");
1279							}
1280							}
1281
1282
1283							=head2 _dump_comments()
1284
1285							Title : _dump_comments()
1286							Usage : $self->_dump_comments();
1287							Function: Debug dump the comments section from the scf.
1288							Returns : Nothing.
1289							Args : Nothing.
1290							Notes : None.
1291
1292							=cut
1293
1294							sub _dump_comments {
1295	0			0			my ($self) = @_;
1296	0						warn ("SCF comments:\n");
1297	0						foreach my $k (keys %{$self->{'comments'}}) {
	0
1298	0						warn ("\t {$k} ==> ", $self->{'comments'}->{$k}, "\n");
1299							}
1300							}
1301
1302
1303
1304							1;
1305							__END__