| line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
|
1
|
|
|
|
|
|
|
# |
|
2
|
|
|
|
|
|
|
# BioPerl module for Bio::Tools::Run::Match |
|
3
|
|
|
|
|
|
|
# |
|
4
|
|
|
|
|
|
|
# Please direct questions and support issues to <bioperl-l@bioperl.org> |
|
5
|
|
|
|
|
|
|
# |
|
6
|
|
|
|
|
|
|
# Cared for by Sendu Bala |
|
7
|
|
|
|
|
|
|
# |
|
8
|
|
|
|
|
|
|
# Copyright Sendu Bala |
|
9
|
|
|
|
|
|
|
# |
|
10
|
|
|
|
|
|
|
# You may distribute this module under the same terms as perl itself |
|
11
|
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
# POD documentation - main docs before the code |
|
13
|
|
|
|
|
|
|
|
|
14
|
|
|
|
|
|
|
=head1 NAME |
|
15
|
|
|
|
|
|
|
|
|
16
|
|
|
|
|
|
|
Bio::Tools::Run::Match - Wrapper for Transfac's match(TM) |
|
17
|
|
|
|
|
|
|
|
|
18
|
|
|
|
|
|
|
=head1 SYNOPSIS |
|
19
|
|
|
|
|
|
|
|
|
20
|
|
|
|
|
|
|
use Bio::Tools::Run::Match; |
|
21
|
|
|
|
|
|
|
|
|
22
|
|
|
|
|
|
|
# Make a Match factory |
|
23
|
|
|
|
|
|
|
$factory = Bio::Tools::Run::Match->new(-mxlib => '/path/to/matrix.dat'); |
|
24
|
|
|
|
|
|
|
|
|
25
|
|
|
|
|
|
|
# Run Match on a sequence object |
|
26
|
|
|
|
|
|
|
my @results = $factory->run($bio_seq); |
|
27
|
|
|
|
|
|
|
|
|
28
|
|
|
|
|
|
|
# look at the results |
|
29
|
|
|
|
|
|
|
foreach my $feat (@results) { |
|
30
|
|
|
|
|
|
|
my $seq_id = $feat->seq_id; |
|
31
|
|
|
|
|
|
|
my $start = $feat->start; |
|
32
|
|
|
|
|
|
|
my $end = $feat->end; |
|
33
|
|
|
|
|
|
|
my $score = $feat->score; |
|
34
|
|
|
|
|
|
|
my ($pvalue) = $feat->get_tag_values('pvalue'); |
|
35
|
|
|
|
|
|
|
} |
|
36
|
|
|
|
|
|
|
|
|
37
|
|
|
|
|
|
|
=head1 DESCRIPTION |
|
38
|
|
|
|
|
|
|
|
|
39
|
|
|
|
|
|
|
This is a wrapper for running the match(TM) program supplied with Transfac Pro |
|
40
|
|
|
|
|
|
|
distributions. |
|
41
|
|
|
|
|
|
|
|
|
42
|
|
|
|
|
|
|
You can try supplying normal match command-line arguments to new(), eg. |
|
43
|
|
|
|
|
|
|
new(-b => 1) or calling arg-named methods (excluding the initial |
|
44
|
|
|
|
|
|
|
hyphens, eg. $factory->b(1) to set the -b option to true). |
|
45
|
|
|
|
|
|
|
|
|
46
|
|
|
|
|
|
|
Histogram output isn't supported. -p is supported by using -mxprf, see the |
|
47
|
|
|
|
|
|
|
docs of new() for details. |
|
48
|
|
|
|
|
|
|
|
|
49
|
|
|
|
|
|
|
You will need to enable this match wrapper to find the match executable. |
|
50
|
|
|
|
|
|
|
This can be done in (at least) three ways: |
|
51
|
|
|
|
|
|
|
|
|
52
|
|
|
|
|
|
|
1. Make sure match is in your path. |
|
53
|
|
|
|
|
|
|
2. Define an environmental variable MATCHDIR which is a |
|
54
|
|
|
|
|
|
|
directory which contains the match executable: |
|
55
|
|
|
|
|
|
|
In bash: |
|
56
|
|
|
|
|
|
|
|
|
57
|
|
|
|
|
|
|
export MATCHDIR=/home/username/match/ |
|
58
|
|
|
|
|
|
|
|
|
59
|
|
|
|
|
|
|
In csh/tcsh: |
|
60
|
|
|
|
|
|
|
|
|
61
|
|
|
|
|
|
|
setenv MATCHDIR /home/username/match |
|
62
|
|
|
|
|
|
|
|
|
63
|
|
|
|
|
|
|
3. Include a definition of an environmental variable MATCHDIR in |
|
64
|
|
|
|
|
|
|
every script that will use this match wrapper module, e.g.: |
|
65
|
|
|
|
|
|
|
|
|
66
|
|
|
|
|
|
|
BEGIN { $ENV{MATCHDIR} = '/home/username/match/' } |
|
67
|
|
|
|
|
|
|
use Bio::Tools::Run::Match; |
|
68
|
|
|
|
|
|
|
|
|
69
|
|
|
|
|
|
|
=head1 FEEDBACK |
|
70
|
|
|
|
|
|
|
|
|
71
|
|
|
|
|
|
|
=head2 Mailing Lists |
|
72
|
|
|
|
|
|
|
|
|
73
|
|
|
|
|
|
|
User feedback is an integral part of the evolution of this and other |
|
74
|
|
|
|
|
|
|
Bioperl modules. Send your comments and suggestions preferably to |
|
75
|
|
|
|
|
|
|
the Bioperl mailing list. Your participation is much appreciated. |
|
76
|
|
|
|
|
|
|
|
|
77
|
|
|
|
|
|
|
bioperl-l@bioperl.org - General discussion |
|
78
|
|
|
|
|
|
|
http://bioperl.org/wiki/Mailing_lists - About the mailing lists |
|
79
|
|
|
|
|
|
|
|
|
80
|
|
|
|
|
|
|
=head2 Support |
|
81
|
|
|
|
|
|
|
|
|
82
|
|
|
|
|
|
|
Please direct usage questions or support issues to the mailing list: |
|
83
|
|
|
|
|
|
|
|
|
84
|
|
|
|
|
|
|
I<bioperl-l@bioperl.org> |
|
85
|
|
|
|
|
|
|
|
|
86
|
|
|
|
|
|
|
rather than to the module maintainer directly. Many experienced and |
|
87
|
|
|
|
|
|
|
responsive experts will be able to look at the problem and quickly |
|
88
|
|
|
|
|
|
|
address it. Please include a thorough description of the problem |
|
89
|
|
|
|
|
|
|
with code and data examples if at all possible. |
|
90
|
|
|
|
|
|
|
|
|
91
|
|
|
|
|
|
|
=head2 Reporting Bugs |
|
92
|
|
|
|
|
|
|
|
|
93
|
|
|
|
|
|
|
Report bugs to the Bioperl bug tracking system to help us keep track |
|
94
|
|
|
|
|
|
|
of the bugs and their resolution. Bug reports can be submitted via |
|
95
|
|
|
|
|
|
|
the web: |
|
96
|
|
|
|
|
|
|
|
|
97
|
|
|
|
|
|
|
http://redmine.open-bio.org/projects/bioperl/ |
|
98
|
|
|
|
|
|
|
|
|
99
|
|
|
|
|
|
|
=head1 AUTHOR - Sendu Bala |
|
100
|
|
|
|
|
|
|
|
|
101
|
|
|
|
|
|
|
Email bix@sendu.me.uk |
|
102
|
|
|
|
|
|
|
|
|
103
|
|
|
|
|
|
|
=head1 APPENDIX |
|
104
|
|
|
|
|
|
|
|
|
105
|
|
|
|
|
|
|
The rest of the documentation details each of the object methods. |
|
106
|
|
|
|
|
|
|
Internal methods are usually preceded with a _ |
|
107
|
|
|
|
|
|
|
|
|
108
|
|
|
|
|
|
|
=cut |
|
109
|
|
|
|
|
|
|
|
|
110
|
|
|
|
|
|
|
package Bio::Tools::Run::Match; |
|
111
|
1
|
|
|
1
|
|
107221
|
use strict; |
|
|
1
|
|
|
|
|
1
|
|
|
|
1
|
|
|
|
|
23
|
|
|
112
|
|
|
|
|
|
|
|
|
113
|
1
|
|
|
1
|
|
3
|
use Cwd; |
|
|
1
|
|
|
|
|
1
|
|
|
|
1
|
|
|
|
|
46
|
|
|
114
|
1
|
|
|
1
|
|
3
|
use File::Spec; |
|
|
1
|
|
|
|
|
1
|
|
|
|
1
|
|
|
|
|
20
|
|
|
115
|
1
|
|
|
1
|
|
459
|
use Bio::SeqIO; |
|
|
1
|
|
|
|
|
38306
|
|
|
|
1
|
|
|
|
|
25
|
|
|
116
|
1
|
|
|
1
|
|
164
|
use Bio::FeatureIO; |
|
|
0
|
|
|
|
|
|
|
|
|
0
|
|
|
|
|
|
|
|
117
|
|
|
|
|
|
|
use Bio::Annotation::SimpleValue; |
|
118
|
|
|
|
|
|
|
use Bio::Tools::Match; |
|
119
|
|
|
|
|
|
|
|
|
120
|
|
|
|
|
|
|
use base qw(Bio::Tools::Run::WrapperBase); |
|
121
|
|
|
|
|
|
|
|
|
122
|
|
|
|
|
|
|
# name of the executable, and the directory to look for it in (taken from the
# MATCHDIR environment variable at the time this package is loaded)
our ($PROGRAM_NAME, $PROGRAM_DIR) = ('match', $ENV{'MATCHDIR'});

# methods for the match args we support; the @PARAMS entries aren't actually
# match args, but are methods we use internally
our @PARAMS   = ('mxlib', 'mxprf', 'imcut');
our @SWITCHES = ('b', 'u');

# just to be explicit, args we don't support (yet) or we handle ourselves
our @UNSUPPORTED = ('H', 'HH', 'pp', 'ppg', 'pn', 'png', 'pr', 'jkn', 'i', 'p');
|
132
|
|
|
|
|
|
|
|
|
133
|
|
|
|
|
|
|
|
|
134
|
|
|
|
|
|
|
=head2 program_name |
|
135
|
|
|
|
|
|
|
|
|
136
|
|
|
|
|
|
|
Title : program_name |
|
137
|
|
|
|
|
|
|
Usage : $factory->program_name() |
|
138
|
|
|
|
|
|
|
Function: holds the program name |
|
139
|
|
|
|
|
|
|
Returns : string |
|
140
|
|
|
|
|
|
|
Args : None |
|
141
|
|
|
|
|
|
|
|
|
142
|
|
|
|
|
|
|
=cut |
|
143
|
|
|
|
|
|
|
|
|
144
|
|
|
|
|
|
|
sub program_name {
    # The executable name is held in the package-level $PROGRAM_NAME variable
    my $name = $PROGRAM_NAME;
    return $name;
}
|
147
|
|
|
|
|
|
|
|
|
148
|
|
|
|
|
|
|
=head2 program_dir |
|
149
|
|
|
|
|
|
|
|
|
150
|
|
|
|
|
|
|
Title : program_dir |
|
151
|
|
|
|
|
|
|
Usage : $factory->program_dir() |
|
152
|
|
|
|
|
|
|
Function: returns the program directory, obtained from ENV variable. |
|
153
|
|
|
|
|
|
|
Returns : string |
|
154
|
|
|
|
|
|
|
Args : None |
|
155
|
|
|
|
|
|
|
|
|
156
|
|
|
|
|
|
|
=cut |
|
157
|
|
|
|
|
|
|
|
|
158
|
|
|
|
|
|
|
sub program_dir {
    # $PROGRAM_DIR is assigned from $ENV{'MATCHDIR'} when this package is
    # loaded, so it is undef if that variable was not set at that point
    my $dir = $PROGRAM_DIR;
    return $dir;
}
|
161
|
|
|
|
|
|
|
|
|
162
|
|
|
|
|
|
|
=head2 new |
|
163
|
|
|
|
|
|
|
|
|
164
|
|
|
|
|
|
|
Title : new |
|
165
|
|
|
|
|
|
|
Usage : $factory = Bio::Tools::Run::Match->new() |
|
166
|
|
|
|
|
|
|
Function: creates a new Match factory |
|
167
|
|
|
|
|
|
|
Returns : Bio::Tools::Run::Match |
|
168
|
|
|
|
|
|
|
Args : The following args can either be supplied here or set by calling |
|
169
|
|
|
|
|
|
|
arg-named methods (eg. $factory->imcut(2) ). |
|
170
|
|
|
|
|
|
|
|
|
171
|
|
|
|
|
|
|
-mxlib => path to the matrix.dat file containing Transfac matrices |
|
172
|
|
|
|
|
|
|
-mxprf => path to a profile file | [core_thresh, [matrix_thresh]] |
|
173
|
|
|
|
|
|
|
(defaults to a standard one based on the mxlib provided if |
|
174
|
|
|
|
|
|
|
file not supplied, using core_thresh and matrix_thresh |
|
175
|
|
|
|
|
|
|
values if those are supplied instead) |
|
176
|
|
|
|
|
|
|
-imcut => floating point number, the importance cutoff |
|
177
|
|
|
|
|
|
|
-b | -u => boolean, mutually exclusive |
|
178
|
|
|
|
|
|
|
|
|
179
|
|
|
|
|
|
|
=cut |
|
180
|
|
|
|
|
|
|
|
|
181
|
|
|
|
|
|
|
sub new {
    my $class = shift;
    my @args  = @_;

    # The parent constructor receives the full, unmodified argument list
    my $self = $class->SUPER::new(@args);

    # Hand the names of the supported args (plus 'quiet') to _set_from_args
    # as -methods, with -create => 1, so values supplied here get applied
    my @methods = (@PARAMS, @SWITCHES, 'quiet');
    $self->_set_from_args(\@args, -methods => \@methods,
                                  -create => 1);

    return $self;
}
|
190
|
|
|
|
|
|
|
|
|
191
|
|
|
|
|
|
|
=head2 run |
|
192
|
|
|
|
|
|
|
|
|
193
|
|
|
|
|
|
|
Title : run |
|
194
|
|
|
|
|
|
|
Usage : @results = $factory->run($bio_seqi_object); |
|
195
|
|
|
|
|
|
|
Function: Runs match on a sequence. |
|
196
|
|
|
|
|
|
|
Returns : list of Bio::SeqFeatureI feature objects |
|
197
|
|
|
|
|
|
|
Args : Bio::SeqI compliant object |
|
198
|
|
|
|
|
|
|
|
|
199
|
|
|
|
|
|
|
NB: mxlib has to have been set prior to calling run(), either as an |
|
200
|
|
|
|
|
|
|
argument to new() or by calling mxlib(). |
|
201
|
|
|
|
|
|
|
|
|
202
|
|
|
|
|
|
|
=cut |
|
203
|
|
|
|
|
|
|
|
|
204
|
|
|
|
|
|
|
sub run {
    my $self  = shift;
    my ($seq) = @_;

    # Refuse to go any further until a matrix library has been supplied
    unless ($self->mxlib) {
        $self->throw("mxlib has to have been set first");
    }

    # The real work is done by the internal _run() method
    return $self->_run($seq);
}
|
210
|
|
|
|
|
|
|
|
|
211
|
|
|
|
|
|
|
# Internal worker for run(): writes the sequence to a fasta file in a temp
# directory, runs match there (creating a profile file first when no existing
# one was supplied via mxprf), and parses the output file.
#
# Args    : the sequence object passed to run()
# Returns : list of the results yielded by Bio::Tools::Match->next_result;
#           nothing at all if no executable could be found
# Throws  : if the temp dir can't be entered, if either match invocation
#           returns a non-zero status, or if the original working directory
#           can't be restored. Any error raised while working inside the temp
#           dir is re-thrown only after an attempt to chdir back, so a failure
#           no longer leaves the caller stranded in the temp directory.
sub _run {
    my ($self, $seq) = @_;

    my $exe = $self->executable || return;

    # Paths are made absolute up front because we are about to chdir and
    # relative paths would no longer resolve. mxprf may also be an array ref
    # of thresholds instead of a file, in which case -e is false and it is
    # left untouched here.
    my $mxlib = File::Spec->rel2abs($self->mxlib());
    my $mxprf_file = $self->mxprf();
    if ($mxprf_file && -e $mxprf_file) {
        $mxprf_file = File::Spec->rel2abs($mxprf_file);
    }

    # cd to a temp dir
    my $temp_dir = $self->tempdir;
    my $cwd = Cwd->cwd();
    chdir($temp_dir) || $self->throw("Couldn't change to temp dir '$temp_dir'");

    # Everything that happens inside the temp dir is wrapped in eval so that
    # the working directory can be restored even when a step throws.
    my @feats;
    my $ok = eval {
        # make the profile file if necessary
        if (! $mxprf_file || ! -e $mxprf_file) {
            my @thresh;
            if ($mxprf_file && ref($mxprf_file) eq 'ARRAY') {
                @thresh = @{$mxprf_file};
            }

            $mxprf_file = 'mxprf';
            system("$exe $mxlib ignored ignored $mxprf_file -p @thresh") && $self->throw("Something went wrong whist creating profile: $! | $?");
        }

        # output the sequence to a fasta file
        my $seq_file = 'sequence.fa';
        my $so = Bio::SeqIO->new(-file => ">$seq_file", -format => 'fasta');
        $so->write_seq($seq);
        $so->close();

        # run match
        my $result_file = 'out';
        my $param_str = $self->_setparams();
        my $cmd_line = "$exe $mxlib $seq_file $result_file $mxprf_file".$param_str;

        system($cmd_line) && $self->throw("Something went wrong whist running '$cmd_line': $! | $?");

        # parse the results, collecting every feature the parser yields
        my $parser = Bio::Tools::Match->new(-file => $result_file);
        while (my $feat = $parser->next_result) {
            push(@feats, $feat);
        }

        1;
    };
    my $error = $@;

    # cd back again, whether or not the work above succeeded
    my $restored = chdir($cwd);

    # the original failure takes precedence over a failed chdir back
    unless ($ok) {
        die($error || "Unknown error whilst running match\n");
    }
    $restored || $self->throw("Couldn't change back to working directory '$cwd'");

    return @feats;
}
|
265
|
|
|
|
|
|
|
|
|
266
|
|
|
|
|
|
|
=head2 _setparams |
|
267
|
|
|
|
|
|
|
|
|
268
|
|
|
|
|
|
|
Title : _setparams |
|
269
|
|
|
|
|
|
|
Usage : Internal function, not to be called directly |
|
270
|
|
|
|
|
|
|
Function: Creates a string of params to be used in the command string |
|
271
|
|
|
|
|
|
|
Returns : string of params |
|
272
|
|
|
|
|
|
|
Args : none |
|
273
|
|
|
|
|
|
|
|
|
274
|
|
|
|
|
|
|
=cut |
|
275
|
|
|
|
|
|
|
|
|
276
|
|
|
|
|
|
|
sub _setparams {
    my ($self) = @_;

    # Only the boolean switches are handed to the parent implementation,
    # together with -dash => 1
    my $params = $self->SUPER::_setparams(-switches => \@SWITCHES,
                                          -dash => 1);

    # In quiet mode, redirect the command's STDOUT to the null device
    # ('NUL' when $^O looks like MSWin, '/dev/null' otherwise)
    if ($self->quiet) {
        my $sink = '/dev/null';
        $sink = 'NUL' if $^O =~ m/mswin/i;
        $params .= " 1>$sink";
    }

    return $params;
}
|
287
|
|
|
|
|
|
|
|
|
288
|
|
|
|
|
|
|
1; |