line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
|
2
|
|
|
|
|
|
|
=pod |
3
|
|
|
|
|
|
|
|
4
|
|
|
|
|
|
|
=head1 NAME |
5
|
|
|
|
|
|
|
|
6
|
|
|
|
|
|
|
Set::IntSpan::Island - extension for Set::IntSpan to handle islands, holes and covers |
7
|
|
|
|
|
|
|
|
8
|
|
|
|
|
|
|
=head1 SYNOPSIS |
9
|
|
|
|
|
|
|
|
10
|
|
|
|
|
|
|
use Set::IntSpan::Island; |
11
|
|
|
|
|
|
|
|
12
|
|
|
|
|
|
|
# inherits normal behaviour from Set::IntSpan |
13
|
|
|
|
|
|
|
$set = Set::IntSpan::Island->new( $set_spec ); |
14
|
|
|
|
|
|
|
# special pair input creates a span a-b |
15
|
|
|
|
|
|
|
$set = Set::IntSpan::Island->new( $a,$b ); |
16
|
|
|
|
|
|
|
|
17
|
|
|
|
|
|
|
# equivalent to $set->cardinality($another_set)->size; |
18
|
|
|
|
|
|
|
if ($set->overlap( $another_set )) { ... } |
19
|
|
|
|
|
|
|
|
20
|
|
|
|
|
|
|
# distance between spans is negative if spans overlap, positive if not |
21
|
|
|
|
|
|
|
$distance = $set->distance( $another_set ); |
22
|
|
|
|
|
|
|
|
23
|
|
|
|
|
|
|
# remove islands whose size is smaller than $minsize |
24
|
|
|
|
|
|
|
$new_set = $set->excise( $minsize ); |
25
|
|
|
|
|
|
|
|
26
|
|
|
|
|
|
|
# remove islands whose size is found in the set $sizes_set, |
27
|
|
|
|
|
|
|
$new_set = $set->excise( $sizes_set ); |
28
|
|
|
|
|
|
|
# all islands sized <= 10 removed |
29
|
|
|
|
|
|
|
$new_set = $set->excise( Set::IntSpan( "(-10" ) ); |
30
|
|
|
|
|
|
|
# all islands sized >= 10 removed |
31
|
|
|
|
|
|
|
$new_set = $set->excise( Set::IntSpan( "10-)" ) ); |
32
|
|
|
|
|
|
|
# all islands of size between 2-5 removed |
33
|
|
|
|
|
|
|
$new_set = $set->excise( Set::IntSpan( "2-5" ) ); |
34
|
|
|
|
|
|
|
|
35
|
|
|
|
|
|
|
# remove islands larger than $maxlength |
36
|
|
|
|
|
|
|
$set = $set->excise_large( $minlength ); |
37
|
|
|
|
|
|
|
|
38
|
|
|
|
|
|
|
# fill holes up to $maxsize |
39
|
|
|
|
|
|
|
$set = $set->fill( $maxsize ); |
40
|
|
|
|
|
|
|
|
41
|
|
|
|
|
|
|
# fill holes whose size is found in the set $sizes_set |
42
|
|
|
|
|
|
|
$set = $set->fill( $sizes_set); |
43
|
|
|
|
|
|
|
# all holes sizes <= 10 filled |
44
|
|
|
|
|
|
|
$set = $set->fill( Set::IntSpan( "(-10" ) ); |
45
|
|
|
|
|
|
|
# all holes sizes >= 10 filled |
46
|
|
|
|
|
|
|
$set = $set->fill( Set::IntSpan( "10-)" ) ); |
47
|
|
|
|
|
|
|
# all holes sizes 2-5 filled |
48
|
|
|
|
|
|
|
$set = $set->fill( Set::IntSpan( "2-5" ) ); |
49
|
|
|
|
|
|
|
|
50
|
|
|
|
|
|
|
# return a set composed of islands of $set that overlap $another_set |
51
|
|
|
|
|
|
|
$set = $set->find_island( $another_set ); |
52
|
|
|
|
|
|
|
|
53
|
|
|
|
|
|
|
# return a set composed of the nearest non-overlapping island(s) to $another_set |
54
|
|
|
|
|
|
|
$set = $set->nearest_island( $another_set ); |
55
|
|
|
|
|
|
|
|
56
|
|
|
|
|
|
|
# construct a list of covers by exhaustively intersecting all sets |
57
|
|
|
|
|
|
|
@covers = Set::IntSpan::Island->extract_covers( { id1=>$set1, id2=>set2, ... } ); |
58
|
|
|
|
|
|
|
for $cover (@covers) { |
59
|
|
|
|
|
|
|
($coverset,@ids) = ($cover->[0], @{$cover->[1]}); |
60
|
|
|
|
|
|
|
print "cover",$coverset->run_list,"contains sets",join(",",@ids); |
61
|
|
|
|
|
|
|
} |
62
|
|
|
|
|
|
|
|
63
|
|
|
|
|
|
|
=head1 DESCRIPTION |
64
|
|
|
|
|
|
|
|
65
|
|
|
|
|
|
|
This module extends the C module by Steve McDougall. It |
66
|
|
|
|
|
|
|
implementing methods that are specific to islands, holes and |
67
|
|
|
|
|
|
|
covers. C inherits from Set::IntSpan. |
68
|
|
|
|
|
|
|
|
69
|
|
|
|
|
|
|
=head2 Terminology |
70
|
|
|
|
|
|
|
|
71
|
|
|
|
|
|
|
An integer set, as represented by C, is a collection of |
72
|
|
|
|
|
|
|
islands (or spans) on the number line |
73
|
|
|
|
|
|
|
|
74
|
|
|
|
|
|
|
...-----xxxx----xxxxxxxx---xxxxxxxx---xx---x----.... |
75
|
|
|
|
|
|
|
|
76
|
|
|
|
|
|
|
Holes are regions not in the set that fall between adjacent spans. For |
77
|
|
|
|
|
|
|
example, the integer set above is composed of 5 islands and 4 |
78
|
|
|
|
|
|
|
holes. The two infinite regions on either side of the set are not |
79
|
|
|
|
|
|
|
counted as holes within the context of this module. |
80
|
|
|
|
|
|
|
|
81
|
|
|
|
|
|
|
=head1 METHODS |
82
|
|
|
|
|
|
|
|
83
|
|
|
|
|
|
|
=cut |
84
|
|
|
|
|
|
|
|
85
|
|
|
|
|
|
|
package Set::IntSpan::Island; |
86
|
|
|
|
|
|
|
|
87
|
15
|
|
|
15
|
|
368147
|
use 5; |
|
15
|
|
|
|
|
58
|
|
|
15
|
|
|
|
|
698
|
|
88
|
15
|
|
|
15
|
|
88
|
use strict; |
|
15
|
|
|
|
|
31
|
|
|
15
|
|
|
|
|
697
|
|
89
|
15
|
|
|
15
|
|
78
|
use warnings FATAL=>"all"; |
|
15
|
|
|
|
|
23
|
|
|
15
|
|
|
|
|
4008
|
|
90
|
|
|
|
|
|
|
|
91
|
15
|
|
|
15
|
|
14801
|
use parent qw(Exporter); |
|
15
|
|
|
|
|
5286
|
|
|
15
|
|
|
|
|
82
|
|
92
|
15
|
|
|
15
|
|
779
|
use parent qw(Set::IntSpan); |
|
15
|
|
|
|
|
29
|
|
|
15
|
|
|
|
|
61
|
|
93
|
|
|
|
|
|
|
|
94
|
|
|
|
|
|
|
our @EXPORT = qw(); |
95
|
|
|
|
|
|
|
our @EXPORT_OK = qw(); |
96
|
|
|
|
|
|
|
|
97
|
15
|
|
|
15
|
|
228985
|
use Set::IntSpan 1.13; |
|
15
|
|
|
|
|
472
|
|
|
15
|
|
|
|
|
800
|
|
98
|
15
|
|
|
15
|
|
86
|
use Carp; |
|
15
|
|
|
|
|
33
|
|
|
15
|
|
|
|
|
40404
|
|
99
|
|
|
|
|
|
|
|
100
|
|
|
|
|
|
|
our $VERSION = '0.10'; |
101
|
|
|
|
|
|
|
|
102
|
|
|
|
|
|
|
=pod |
103
|
|
|
|
|
|
|
|
104
|
|
|
|
|
|
|
=head2 $set = Set::IntSpan::Island->new( $set_spec ) |
105
|
|
|
|
|
|
|
|
106
|
|
|
|
|
|
|
Constructs a set using the set specification as supported by C. |
107
|
|
|
|
|
|
|
|
108
|
|
|
|
|
|
|
=head2 $set = Set::IntSpan::Island->new( $a, $b ) |
109
|
|
|
|
|
|
|
|
110
|
|
|
|
|
|
|
Extension to C C method, this double-argument |
111
|
|
|
|
|
|
|
version creates a set formed by the range a-b. This is equivalent to |
112
|
|
|
|
|
|
|
|
113
|
|
|
|
|
|
|
$set = Set::IntSpan::Island->new("$a-$b") |
114
|
|
|
|
|
|
|
|
115
|
|
|
|
|
|
|
but permits initialization from a list instead of a string. The |
116
|
|
|
|
|
|
|
arguments $a and $b are expected to be integers - any decimal |
117
|
|
|
|
|
|
|
component will be truncated. |
118
|
|
|
|
|
|
|
|
119
|
|
|
|
|
|
|
new(1.2,2.9) equivalent to new(1,2) |
120
|
|
|
|
|
|
|
|
121
|
|
|
|
|
|
|
=cut |
122
|
|
|
|
|
|
|
|
123
|
|
|
|
|
|
|
sub new { |
124
|
472359
|
|
|
472359
|
1
|
14296282
|
my ($this, @args) = @_; |
125
|
472359
|
|
66
|
|
|
1107576
|
my $class = ref($this) || $this; |
126
|
472359
|
|
|
|
|
529566
|
my $self; |
127
|
472359
|
100
|
|
|
|
848463
|
if(@args <= 1) { |
|
|
50
|
|
|
|
|
|
128
|
|
|
|
|
|
|
# relegate to parent |
129
|
450683
|
|
|
|
|
1311611
|
$self = $class->SUPER::new(@args); |
130
|
|
|
|
|
|
|
} elsif (@args==2) { |
131
|
|
|
|
|
|
|
# treat as request to create span x-y |
132
|
21676
|
|
|
|
|
35529
|
my ($x,$y) = map {int($_)} @args; |
|
43352
|
|
|
|
|
96775
|
|
133
|
21676
|
100
|
|
|
|
50114
|
if($x == $y) { |
134
|
1252
|
|
|
|
|
4330
|
$self = $class->SUPER::new($x); |
135
|
|
|
|
|
|
|
} else { |
136
|
20424
|
|
|
|
|
106908
|
$self = $class->SUPER::new("$x-$y"); |
137
|
|
|
|
|
|
|
} |
138
|
|
|
|
|
|
|
} else { |
139
|
0
|
|
|
|
|
0
|
confess "Set::IntSpan::Island: cannot create object using more than two integers [@args]"; |
140
|
|
|
|
|
|
|
} |
141
|
472359
|
|
|
|
|
14494031
|
return $self; |
142
|
|
|
|
|
|
|
} |
143
|
|
|
|
|
|
|
|
144
|
|
|
|
|
|
|
=pod |
145
|
|
|
|
|
|
|
|
146
|
|
|
|
|
|
|
=head2 $set_copy = $set->clone() |
147
|
|
|
|
|
|
|
|
148
|
|
|
|
|
|
|
Creates a copy of C<$set>. Also accessible using C<$set->duplicate()>; |
149
|
|
|
|
|
|
|
|
150
|
|
|
|
|
|
|
=head2 $set_copy = $set->duplicate() |
151
|
|
|
|
|
|
|
|
152
|
|
|
|
|
|
|
Same as C. |
153
|
|
|
|
|
|
|
|
154
|
|
|
|
|
|
|
=cut |
155
|
|
|
|
|
|
|
|
156
|
|
|
|
|
|
|
sub duplicate { |
157
|
21
|
|
|
21
|
1
|
40
|
my $self = shift; |
158
|
21
|
|
|
|
|
64
|
return $self->new($self->run_list); |
159
|
|
|
|
|
|
|
} |
160
|
|
|
|
|
|
|
|
161
|
|
|
|
|
|
|
sub clone { |
162
|
7
|
|
|
7
|
1
|
27
|
my $self = shift; |
163
|
7
|
|
|
|
|
20
|
return $self->new($self->run_list); |
164
|
|
|
|
|
|
|
} |
165
|
|
|
|
|
|
|
|
166
|
|
|
|
|
|
|
=pod |
167
|
|
|
|
|
|
|
|
168
|
|
|
|
|
|
|
=head2 $olap = $set->overlap( $another_set ); |
169
|
|
|
|
|
|
|
|
170
|
|
|
|
|
|
|
Returns the size of intersection of two sets. Equivalent to |
171
|
|
|
|
|
|
|
|
172
|
|
|
|
|
|
|
$set->intersect( $another_set )->size; |
173
|
|
|
|
|
|
|
|
174
|
|
|
|
|
|
|
The returned value is either 0 (if the sets do not overlap) or positive (if they do). |
175
|
|
|
|
|
|
|
|
176
|
|
|
|
|
|
|
=cut |
177
|
|
|
|
|
|
|
|
178
|
|
|
|
|
|
|
sub overlap { |
179
|
240702
|
|
|
240702
|
1
|
295955
|
my ($self,$set) = @_; |
180
|
240702
|
|
|
|
|
583698
|
return $self->intersect($set)->size; |
181
|
|
|
|
|
|
|
} |
182
|
|
|
|
|
|
|
|
183
|
|
|
|
|
|
|
=pod |
184
|
|
|
|
|
|
|
|
185
|
|
|
|
|
|
|
=head2 $d = $set->distance( $another_set ) |
186
|
|
|
|
|
|
|
|
187
|
|
|
|
|
|
|
Returns the distance between sets, measured as follows. If the sets |
188
|
|
|
|
|
|
|
overlap, then the distance is negative and given by |
189
|
|
|
|
|
|
|
|
190
|
|
|
|
|
|
|
$d = -$set->overlap( $another_set ) |
191
|
|
|
|
|
|
|
|
192
|
|
|
|
|
|
|
If the sets abut, C<$d> is 1. Here $d can be interpreted as the |
193
|
|
|
|
|
|
|
difference between the closest edges of the two sets. |
194
|
|
|
|
|
|
|
|
195
|
|
|
|
|
|
|
The above generalizes to 1+size(hole) if the sets do not overlap and |
196
|
|
|
|
|
|
|
are composed of multiple islands. The hole used is the one between two |
197
|
|
|
|
|
|
|
closest islands of the sets. |
198
|
|
|
|
|
|
|
|
199
|
|
|
|
|
|
|
Returns C if C<$another_set> is not defined, or either C<$set> |
200
|
|
|
|
|
|
|
or C<$another_set> is empty. |
201
|
|
|
|
|
|
|
|
202
|
|
|
|
|
|
|
Here are some examples of how the distance is calculated. |
203
|
|
|
|
|
|
|
|
204
|
|
|
|
|
|
|
A ----xxxx---xxx-----xx-- |
205
|
|
|
|
|
|
|
B ------xxx------xx--x--- |
206
|
|
|
|
|
|
|
!! ! d=-3 |
207
|
|
|
|
|
|
|
|
208
|
|
|
|
|
|
|
A ----xxxx---xxx-----xx-- |
209
|
|
|
|
|
|
|
B ----xxxx---xxx--------- |
210
|
|
|
|
|
|
|
!!!! !!! d=-7 |
211
|
|
|
|
|
|
|
|
212
|
|
|
|
|
|
|
A ----xxxx---xxx-----xx-- |
213
|
|
|
|
|
|
|
B --------------x-------- |
214
|
|
|
|
|
|
|
>< d=1 |
215
|
|
|
|
|
|
|
|
216
|
|
|
|
|
|
|
A ----xxxx---xxx-----xx-- |
217
|
|
|
|
|
|
|
B ---------------x------- |
218
|
|
|
|
|
|
|
> < d=2 |
219
|
|
|
|
|
|
|
|
220
|
|
|
|
|
|
|
A ----xxxx---xxx-----xx-- |
221
|
|
|
|
|
|
|
B ---------------xx------ |
222
|
|
|
|
|
|
|
> < d=2 |
223
|
|
|
|
|
|
|
|
224
|
|
|
|
|
|
|
A ----xxxx---xxx-----xx-- |
225
|
|
|
|
|
|
|
B ---------------xxxx---- |
226
|
|
|
|
|
|
|
>< d=1 |
227
|
|
|
|
|
|
|
|
228
|
|
|
|
|
|
|
=cut |
229
|
|
|
|
|
|
|
|
230
|
|
|
|
|
|
|
sub distance { |
231
|
55
|
|
|
55
|
1
|
119
|
my ($set1,$set2) = @_; |
232
|
55
|
100
|
100
|
|
|
133
|
return undef unless $set1 && $set2; |
233
|
52
|
50
|
33
|
|
|
1473
|
return undef unless $set1->cardinality && $set2->cardinality; |
234
|
52
|
|
|
|
|
1257
|
my $overlap = $set1->overlap($set2); |
235
|
52
|
100
|
|
|
|
1556
|
if($overlap) { |
236
|
5
|
|
|
|
|
13
|
return -$overlap; |
237
|
|
|
|
|
|
|
} else { |
238
|
47
|
|
|
|
|
51
|
my $min_d; |
239
|
47
|
|
|
|
|
82
|
for my $span1 ($set1->sets) { |
240
|
64
|
|
|
|
|
123
|
for my $span2 ($set2->sets) { |
241
|
64
|
|
|
|
|
1202
|
my $d1 = abs($span1->min - $span2->max); |
242
|
64
|
|
|
|
|
1166
|
my $d2 = abs($span1->max - $span2->min); |
243
|
64
|
100
|
|
|
|
1030
|
my $d = $d1 < $d2 ? $d1 : $d2; |
244
|
64
|
100
|
100
|
|
|
233
|
if(! defined $min_d || $d < $min_d) { |
245
|
53
|
|
|
|
|
222
|
$min_d = $d; |
246
|
|
|
|
|
|
|
} |
247
|
|
|
|
|
|
|
} |
248
|
|
|
|
|
|
|
} |
249
|
47
|
|
|
|
|
182
|
return $min_d; |
250
|
|
|
|
|
|
|
} |
251
|
|
|
|
|
|
|
} |
252
|
|
|
|
|
|
|
|
253
|
|
|
|
|
|
|
=head2 $d = $set->sets() |
254
|
|
|
|
|
|
|
|
255
|
|
|
|
|
|
|
Returns all spans in $set as C objects. This method overrides the C method in C in order to return sets as Set::IntSpan::Island objects. |
256
|
|
|
|
|
|
|
|
257
|
|
|
|
|
|
|
=cut |
258
|
|
|
|
|
|
|
|
259
|
|
|
|
|
|
|
sub sets { |
260
|
15090
|
|
|
15090
|
1
|
714768
|
my $set = shift; |
261
|
15090
|
|
|
|
|
47441
|
return map { $set->new($_->run_list) } $set->SUPER::sets(); |
|
64750
|
|
|
|
|
3587683
|
|
262
|
|
|
|
|
|
|
} |
263
|
|
|
|
|
|
|
|
264
|
|
|
|
|
|
|
=head2 $new_set = $set->excise( $minlength | $size_set ) |
265
|
|
|
|
|
|
|
|
266
|
|
|
|
|
|
|
Removes all islands smaller than C<$minlength>. If C<$minlength> < 1 |
267
|
|
|
|
|
|
|
then no elements are removed and a copy of the set is returned. Since |
268
|
|
|
|
|
|
|
only islands smaller than C<$minlength> are removed, the smallest |
269
|
|
|
|
|
|
|
useful value for C<$minlength> is 2. |
270
|
|
|
|
|
|
|
|
271
|
|
|
|
|
|
|
If passed a set C<$size_set>, removes all islands whose size is found |
272
|
|
|
|
|
|
|
in C<$size_set>. This extended functionality allows you to pass in |
273
|
|
|
|
|
|
|
arbitrary size cutoffs. For example, to remove islands of size <=10 |
274
|
|
|
|
|
|
|
|
275
|
|
|
|
|
|
|
$new_set = $set->excise( Set::IntSpan->( "(-10" ) ) |
276
|
|
|
|
|
|
|
|
277
|
|
|
|
|
|
|
or to remove islands of size 2-10 |
278
|
|
|
|
|
|
|
|
279
|
|
|
|
|
|
|
$new_set = $set->excise( Set::IntSpan->( "2-10" ) ) |
280
|
|
|
|
|
|
|
|
281
|
|
|
|
|
|
|
Since size of an island must be non-zero and positive, any negative |
282
|
|
|
|
|
|
|
elements in the size set will be ignored. The two are therefore equivalent |
283
|
|
|
|
|
|
|
|
284
|
|
|
|
|
|
|
$new_set = $set->excise( Set::IntSpan->( "2-10" ) ) |
285
|
|
|
|
|
|
|
$new_set = $set->excise( Set::IntSpan->( "(--1,2-10" ) ) |
286
|
|
|
|
|
|
|
|
287
|
|
|
|
|
|
|
Using a size set allows you to excise islands larger than a certain |
288
|
|
|
|
|
|
|
size. For example, to remove all islands 10 or bigger, |
289
|
|
|
|
|
|
|
|
290
|
|
|
|
|
|
|
$new_set = $set->excise( Set::IntSpan->( "10-)" ) ) |
291
|
|
|
|
|
|
|
|
292
|
|
|
|
|
|
|
Regardless of input, if all islands are excised (i.e. all elements |
293
|
|
|
|
|
|
|
from $set are removed), this function will return an empty set. |
294
|
|
|
|
|
|
|
|
295
|
|
|
|
|
|
|
Contrast C to C. Use C when you have a set of |
296
|
|
|
|
|
|
|
island sizes you want to remove. Use C when you have a set of |
297
|
|
|
|
|
|
|
island sizes you want to keep. In other words, these are equivalent: |
298
|
|
|
|
|
|
|
|
299
|
|
|
|
|
|
|
$set->excise( $size_set ) |
300
|
|
|
|
|
|
|
$set->keep( $size_set->complement ) |
301
|
|
|
|
|
|
|
|
302
|
|
|
|
|
|
|
Strictly speaking, you can pass in any object as a size limiter, as |
303
|
|
|
|
|
|
|
long as it implements a C function which returns 1 if the |
304
|
|
|
|
|
|
|
size is in the cutoff set and 0 otherwise. |
305
|
|
|
|
|
|
|
|
306
|
|
|
|
|
|
|
$filter = Some::Other::Module->new(); |
307
|
|
|
|
|
|
|
# set $filter parameters according to Some::Other::Module API... |
308
|
|
|
|
|
|
|
... |
309
|
|
|
|
|
|
|
# $filter must implement "member" function |
310
|
|
|
|
|
|
|
$filter->can("member") |
311
|
|
|
|
|
|
|
if($filter->member(10)) { |
312
|
|
|
|
|
|
|
print "islands of size 10 will be removed"; |
313
|
|
|
|
|
|
|
} else { |
314
|
|
|
|
|
|
|
print "islands of size 10 will be kept"; |
315
|
|
|
|
|
|
|
} |
316
|
|
|
|
|
|
|
$set->excise($filter); |
317
|
|
|
|
|
|
|
|
318
|
|
|
|
|
|
|
=cut |
319
|
|
|
|
|
|
|
|
320
|
|
|
|
|
|
|
sub excise { |
321
|
43
|
|
|
43
|
1
|
460
|
my ($self,$length) = @_; |
322
|
43
|
100
|
|
|
|
177
|
if(! ref($length) ) { |
|
|
50
|
|
|
|
|
|
323
|
12
|
|
|
|
|
25
|
my $set = $self->new(); |
324
|
12
|
|
|
|
|
29
|
map { $set = $set->union($_) } grep($_->size >= $length, $self->sets); |
|
12
|
|
|
|
|
266
|
|
325
|
12
|
|
|
|
|
329
|
return $set; |
326
|
|
|
|
|
|
|
} elsif ($length->can("member")) { |
327
|
31
|
|
|
|
|
59
|
my $set = $self->new(); |
328
|
31
|
|
|
|
|
67
|
map { $set = $set->union($_) } grep(! $length->member($_->size), $self->sets); |
|
55
|
|
|
|
|
2841
|
|
329
|
31
|
|
|
|
|
1061
|
return $set; |
330
|
|
|
|
|
|
|
} else { |
331
|
0
|
|
|
|
|
0
|
confess "excise() does not accept a length cutoff of the type you used",ref($length); |
332
|
|
|
|
|
|
|
} |
333
|
|
|
|
|
|
|
} |
334
|
|
|
|
|
|
|
|
335
|
|
|
|
|
|
|
=head2 $new_set = $set->keep( $maxlength | $size_set ) |
336
|
|
|
|
|
|
|
|
337
|
|
|
|
|
|
|
If passed an integer C<$maxlength>, removes all islands larger than |
338
|
|
|
|
|
|
|
C<$maxlength>. |
339
|
|
|
|
|
|
|
|
340
|
|
|
|
|
|
|
If passed a set C<$size_set>, removes all islands whose size is not found |
341
|
|
|
|
|
|
|
in C<$size_set>. For example, to keep all islands sized 10 or larger, |
342
|
|
|
|
|
|
|
|
343
|
|
|
|
|
|
|
$new_set = $set->keep( Set::IntSpan->( "10-)" ) ) |
344
|
|
|
|
|
|
|
|
345
|
|
|
|
|
|
|
or keep all islands sized 2-10 |
346
|
|
|
|
|
|
|
|
347
|
|
|
|
|
|
|
$new_set = $set->excise( Set::IntSpan->( "2-10" ) ) |
348
|
|
|
|
|
|
|
|
349
|
|
|
|
|
|
|
Returns an empty set if no islands are kept. |
350
|
|
|
|
|
|
|
|
351
|
|
|
|
|
|
|
Since size of an island must be non-zero and positive, any negative |
352
|
|
|
|
|
|
|
elements in the size set will be ignored. The two are therefore equivalent |
353
|
|
|
|
|
|
|
|
354
|
|
|
|
|
|
|
$new_set = $set->keep( Set::IntSpan->( "2-10" ) ) |
355
|
|
|
|
|
|
|
$new_set = $set->keep( Set::IntSpan->( "(--1,2-10" ) ) |
356
|
|
|
|
|
|
|
|
357
|
|
|
|
|
|
|
Contrast C to C. Use C when you have a set of island |
358
|
|
|
|
|
|
|
sizes you want to keep. Use C when you have a set of island |
359
|
|
|
|
|
|
|
sizes you want to remove. In other words, these are equivalent: |
360
|
|
|
|
|
|
|
|
361
|
|
|
|
|
|
|
$set->keep( $size_set ) |
362
|
|
|
|
|
|
|
$set->excise( $size_set->complement ) |
363
|
|
|
|
|
|
|
|
364
|
|
|
|
|
|
|
Strictly speaking, you can pass in any object as a size limiter, as |
365
|
|
|
|
|
|
|
long as it implements a C function which returns 1 if the |
366
|
|
|
|
|
|
|
size is in the cutoff set and 0 otherwise. See the description of C for details. |
367
|
|
|
|
|
|
|
|
368
|
|
|
|
|
|
|
=cut |
369
|
|
|
|
|
|
|
|
370
|
|
|
|
|
|
|
sub keep { |
371
|
17
|
|
|
17
|
1
|
810
|
my ($self,$length) = @_; |
372
|
17
|
|
|
|
|
34
|
my $set = $self->new(); |
373
|
17
|
100
|
|
|
|
80
|
if(! ref($length) ) { |
|
|
50
|
|
|
|
|
|
374
|
5
|
|
|
|
|
13
|
map { $set = $set->union($_) } grep($_->size <= $length, $self->sets); |
|
2
|
|
|
|
|
45
|
|
375
|
|
|
|
|
|
|
} elsif ($length->can("member")) { |
376
|
12
|
|
|
|
|
25
|
map { $set = $set->union($_) } grep($length->member($_->size), $self->sets); |
|
11
|
|
|
|
|
477
|
|
377
|
|
|
|
|
|
|
} else { |
378
|
0
|
|
|
|
|
0
|
confess "keep() does not accept a length cutoff of the type you used",ref($length); |
379
|
|
|
|
|
|
|
} |
380
|
17
|
|
|
|
|
517
|
return $set; |
381
|
|
|
|
|
|
|
} |
382
|
|
|
|
|
|
|
|
383
|
|
|
|
|
|
|
=head2 $set = $set->fill( $maxsize | $size_set ) |
384
|
|
|
|
|
|
|
|
385
|
|
|
|
|
|
|
If passed an integer C<$maxsize>, fills in all holes in $set smaller than C<$maxsize>. |
386
|
|
|
|
|
|
|
|
387
|
|
|
|
|
|
|
If passed a set C<$size_set>, fills in all holes whose size appears in C<$size_set>. |
388
|
|
|
|
|
|
|
|
389
|
|
|
|
|
|
|
Strictly speaking, you can pass in any object as a size limiter, as |
390
|
|
|
|
|
|
|
long as it implements a C function which returns 1 if the |
391
|
|
|
|
|
|
|
size is in the cutoff set and 0 otherwise. See the description of C for details. |
392
|
|
|
|
|
|
|
|
393
|
|
|
|
|
|
|
=cut |
394
|
|
|
|
|
|
|
|
395
|
|
|
|
|
|
|
sub fill { |
396
|
14
|
|
|
14
|
1
|
281
|
my ($self,$length) = @_; |
397
|
14
|
|
|
|
|
31
|
my $set = $self->duplicate(); |
398
|
14
|
100
|
|
|
|
50
|
if(! ref($length)) { |
|
|
50
|
|
|
|
|
|
399
|
10
|
|
|
|
|
32
|
for my $hole ( $set->holes->sets ) { |
400
|
12
|
100
|
|
|
|
155
|
if($hole->size <= $length) { |
401
|
9
|
|
|
|
|
129
|
$set = $set->union($hole); |
402
|
|
|
|
|
|
|
} |
403
|
|
|
|
|
|
|
} |
404
|
|
|
|
|
|
|
} elsif ($length->can("member")) { |
405
|
4
|
|
|
|
|
14
|
for my $hole ( $set->holes->sets ) { |
406
|
14
|
100
|
|
|
|
384
|
if($length->member($hole->size)) { |
407
|
11
|
|
|
|
|
249
|
$set = $set->union($hole); |
408
|
|
|
|
|
|
|
} |
409
|
|
|
|
|
|
|
} |
410
|
|
|
|
|
|
|
} else { |
411
|
0
|
|
|
|
|
0
|
confess "fill() does not accept a length cutoff of the type you used",ref($length); |
412
|
|
|
|
|
|
|
} |
413
|
14
|
|
|
|
|
530
|
return $set; |
414
|
|
|
|
|
|
|
} |
415
|
|
|
|
|
|
|
|
416
|
|
|
|
|
|
|
=head2 $island_set = $set->find_islands( $integer | $another_set ) |
417
|
|
|
|
|
|
|
|
418
|
|
|
|
|
|
|
Returns a set composed of islands from $set that overlap with C<$integer> or C<$another_set>. |
419
|
|
|
|
|
|
|
|
420
|
|
|
|
|
|
|
If an integer is passed and C<$integer> is not in C<$set>, an empty set is returned. |
421
|
|
|
|
|
|
|
|
422
|
|
|
|
|
|
|
If a set is passed and C<$set> and C<$another_set> have an empty intersection, an empty set is returned. |
423
|
|
|
|
|
|
|
|
424
|
|
|
|
|
|
|
set ----xxxx---xxx-----xx-- |
425
|
|
|
|
|
|
|
another_set ------------x---------- |
426
|
|
|
|
|
|
|
island_set -----------xxx--------- |
427
|
|
|
|
|
|
|
|
428
|
|
|
|
|
|
|
set ----xxxx---xxx-----xx-- |
429
|
|
|
|
|
|
|
another_set ------------xxxxx------ |
430
|
|
|
|
|
|
|
island_set -----------xxx--------- |
431
|
|
|
|
|
|
|
|
432
|
|
|
|
|
|
|
set ----xxxx---xxx-----xx-- |
433
|
|
|
|
|
|
|
another_set ------------xxxxx---xx- |
434
|
|
|
|
|
|
|
island_set -----------xxx-----xx-- |
435
|
|
|
|
|
|
|
|
436
|
|
|
|
|
|
|
Contrast this to nearest_island() which returns the closest island(s) that |
437
|
|
|
|
|
|
|
do not overlap with C<$integer> or C<$another_set>. |
438
|
|
|
|
|
|
|
|
439
|
|
|
|
|
|
|
=cut |
440
|
|
|
|
|
|
|
|
441
|
|
|
|
|
|
|
sub find_islands { |
442
|
13
|
|
|
13
|
1
|
294
|
my ($self,$anchor) = @_; |
443
|
13
|
100
|
|
|
|
37
|
return $self->new() if ! $anchor; |
444
|
12
|
100
|
|
|
|
108
|
if(! ref($anchor)) { |
|
|
50
|
|
|
|
|
|
445
|
7
|
|
|
|
|
16
|
for my $set ($self->sets) { |
446
|
11
|
100
|
|
|
|
86
|
return $set if $set->member($anchor); |
447
|
|
|
|
|
|
|
} |
448
|
2
|
|
|
|
|
35
|
return $self->new(); |
449
|
|
|
|
|
|
|
} elsif ($anchor->can("intersect")) { |
450
|
5
|
|
|
|
|
13
|
my $islands = $self->new; |
451
|
5
|
100
|
|
|
|
13
|
return $islands if ! $self->overlap($anchor); |
452
|
4
|
|
|
|
|
221
|
for my $set ($self->sets) { |
453
|
8
|
100
|
|
|
|
149
|
$islands->U($set) if $set->overlap($anchor); |
454
|
|
|
|
|
|
|
} |
455
|
4
|
|
|
|
|
114
|
return $islands; |
456
|
|
|
|
|
|
|
} else { |
457
|
0
|
|
|
|
|
0
|
confess "find_islands does not accept an argument of the type you used",ref($anchor); |
458
|
|
|
|
|
|
|
} |
459
|
|
|
|
|
|
|
} |
460
|
|
|
|
|
|
|
|
461
|
|
|
|
|
|
|
=pod |
462
|
|
|
|
|
|
|
|
463
|
|
|
|
|
|
|
=head2 $island_set = $set->nearest_island( $integer | $another_set) |
464
|
|
|
|
|
|
|
|
465
|
|
|
|
|
|
|
Returns the island(s) in C<$set> closest (but not overlapping) to |
466
|
|
|
|
|
|
|
C<$integer> or C<$another_set>. If C<$integer> or C<$another_set> lie |
467
|
|
|
|
|
|
|
exactly between two islands, then the returned set contains these two |
468
|
|
|
|
|
|
|
islands. |
469
|
|
|
|
|
|
|
|
470
|
|
|
|
|
|
|
If no non-overlapping islands in $set are found, an empty set is returned. |
471
|
|
|
|
|
|
|
|
472
|
|
|
|
|
|
|
set ----xxxx---xxx-----xx-- |
473
|
|
|
|
|
|
|
another_set ------------x---------- |
474
|
|
|
|
|
|
|
island_set ----xxxx--------------- |
475
|
|
|
|
|
|
|
|
476
|
|
|
|
|
|
|
set ----xxxx---xxx-----xx-- |
477
|
|
|
|
|
|
|
another_set ------------xxxxx------ |
478
|
|
|
|
|
|
|
island_set -------------------xx-- |
479
|
|
|
|
|
|
|
|
480
|
|
|
|
|
|
|
set ----xxxx---xxx-----xx-- |
481
|
|
|
|
|
|
|
another_set ----------xxxxxxx------ |
482
|
|
|
|
|
|
|
island_set ----xxxx-----------xx-- |
483
|
|
|
|
|
|
|
|
484
|
|
|
|
|
|
|
If $another_set contains multiple islands, such as below, $island_set |
485
|
|
|
|
|
|
|
may also contain multiple islands. |
486
|
|
|
|
|
|
|
|
487
|
|
|
|
|
|
|
set ----xxxx---xxx-----xx-- |
488
|
|
|
|
|
|
|
another_set ---x----xxx------------ |
489
|
|
|
|
|
|
|
island_set ----xxxx---xxx--------- |
490
|
|
|
|
|
|
|
|
491
|
|
|
|
|
|
|
Contrast this to C which returns the island(s) that |
492
|
|
|
|
|
|
|
overlap with C<$integer> or C<$another_set>. |
493
|
|
|
|
|
|
|
|
494
|
|
|
|
|
|
|
=cut |
495
|
|
|
|
|
|
|
|
496
|
|
|
|
|
|
|
sub nearest_island { |
497
|
21
|
|
|
21
|
1
|
776
|
my ($self,$anchor) = @_; |
498
|
21
|
100
|
|
|
|
87
|
if(! ref($anchor)) { |
|
|
50
|
|
|
|
|
|
499
|
8
|
|
|
|
|
16
|
$anchor = $self->new($anchor); |
500
|
|
|
|
|
|
|
} elsif ($anchor->can("sets")) { |
501
|
|
|
|
|
|
|
# same type of object |
502
|
|
|
|
|
|
|
} else { |
503
|
0
|
|
|
|
|
0
|
confess "nearest_island does not accept an argument of the type you used",ref($anchor); |
504
|
|
|
|
|
|
|
} |
505
|
21
|
|
|
|
|
38
|
my $island = $self->new(); |
506
|
21
|
|
|
|
|
25
|
my $min_d; |
507
|
21
|
|
|
|
|
37
|
for my $s ($self->sets) { |
508
|
38
|
|
|
|
|
260
|
for my $ss ($anchor->sets) { |
509
|
44
|
100
|
|
|
|
1536
|
next if $s->overlap($ss); |
510
|
34
|
|
|
|
|
1033
|
my $d = $s->distance($ss); |
511
|
34
|
100
|
100
|
|
|
120
|
if(! defined $min_d || $d <= $min_d) { |
512
|
26
|
100
|
100
|
|
|
64
|
if(defined $min_d && $d == $min_d) { |
513
|
5
|
|
|
|
|
14
|
$island = $island->union($s); |
514
|
|
|
|
|
|
|
} else { |
515
|
21
|
|
|
|
|
20
|
$min_d = $d; |
516
|
21
|
|
|
|
|
67
|
$island = $s; |
517
|
|
|
|
|
|
|
} |
518
|
|
|
|
|
|
|
} |
519
|
|
|
|
|
|
|
} |
520
|
|
|
|
|
|
|
} |
521
|
21
|
|
|
|
|
478
|
return $island; |
522
|
|
|
|
|
|
|
} |
523
|
|
|
|
|
|
|
|
524
|
|
|
|
|
|
|
=pod |
525
|
|
|
|
|
|
|
|
526
|
|
|
|
|
|
|
=head2 $num_islands = $set->num_islands() |
527
|
|
|
|
|
|
|
|
528
|
|
|
|
|
|
|
Returns the number of islands in the set. If the set is empty, 0 is returned. |
529
|
|
|
|
|
|
|
|
530
|
|
|
|
|
|
|
=cut |
531
|
|
|
|
|
|
|
|
532
|
|
|
|
|
|
|
sub num_islands { |
533
|
39
|
|
|
39
|
1
|
119
|
my $self = shift; |
534
|
39
|
|
|
|
|
124
|
return scalar $self->spans; |
535
|
|
|
|
|
|
|
} |
536
|
|
|
|
|
|
|
|
537
|
|
|
|
|
|
|
=head2 $island = $set->at_island( $island_index ) |
538
|
|
|
|
|
|
|
|
539
|
|
|
|
|
|
|
Returns the island indexed by $island_index. Islands are |
540
|
|
|
|
|
|
|
0-indexed. For a set with N islands, the first island (ordered |
541
|
|
|
|
|
|
|
left-to-right) has index 0 and the last island has index N-1. |
542
|
|
|
|
|
|
|
|
543
|
|
|
|
|
|
|
If $island_index is negative, counting is done back from the last |
544
|
|
|
|
|
|
|
island. |
545
|
|
|
|
|
|
|
|
546
|
|
|
|
|
|
|
If $island_index is beyond the last island, undef is returned. |
547
|
|
|
|
|
|
|
|
548
|
|
|
|
|
|
|
=cut |
549
|
|
|
|
|
|
|
|
550
|
|
|
|
|
|
|
sub at_island { |
551
|
140
|
|
|
140
|
1
|
262
|
my ($self,$n) = @_; |
552
|
140
|
|
|
|
|
275
|
my @islands = $self->sets; |
553
|
140
|
100
|
100
|
|
|
1401
|
return defined $n && defined $islands[$n] ? $islands[$n] : undef; |
554
|
|
|
|
|
|
|
} |
555
|
|
|
|
|
|
|
|
556
|
|
|
|
|
|
|
=pod |
557
|
|
|
|
|
|
|
|
558
|
|
|
|
|
|
|
=head2 $island = $set->first_island() |
559
|
|
|
|
|
|
|
|
560
|
|
|
|
|
|
|
Returns the first island of the set. As a side-effect, sets the |
561
|
|
|
|
|
|
|
iterator to the first island. |
562
|
|
|
|
|
|
|
|
563
|
|
|
|
|
|
|
If the set is empty, returns undef. |
564
|
|
|
|
|
|
|
|
565
|
|
|
|
|
|
|
=cut |
566
|
|
|
|
|
|
|
|
567
|
|
|
|
|
|
|
sub first_island { |
568
|
11
|
|
|
11
|
1
|
55
|
my $self = shift; |
569
|
11
|
100
|
|
|
|
40
|
if($self->cardinality) { |
570
|
9
|
|
|
|
|
103
|
$self->{iterator} = 0; |
571
|
9
|
|
|
|
|
20
|
return $self->at_island( $self->{iterator} ); |
572
|
|
|
|
|
|
|
} else { |
573
|
2
|
|
|
|
|
29
|
$self->{iterator} = undef; |
574
|
2
|
|
|
|
|
15
|
return undef; |
575
|
|
|
|
|
|
|
} |
576
|
|
|
|
|
|
|
} |
577
|
|
|
|
|
|
|
|
578
|
|
|
|
|
|
|
=pod |
579
|
|
|
|
|
|
|
|
580
|
|
|
|
|
|
|
=head2 $island = $set->last_island() |
581
|
|
|
|
|
|
|
|
582
|
|
|
|
|
|
|
Returns the last island of the set. As a side-effect, sets the |
583
|
|
|
|
|
|
|
iterator to the last island. |
584
|
|
|
|
|
|
|
|
585
|
|
|
|
|
|
|
If the set is empty, returns undef. |
586
|
|
|
|
|
|
|
|
587
|
|
|
|
|
|
|
=cut |
588
|
|
|
|
|
|
|
|
589
|
|
|
|
|
|
|
sub last_island { |
590
|
9
|
|
|
9
|
1
|
44
|
my $self = shift; |
591
|
9
|
50
|
|
|
|
24
|
if($self->cardinality) { |
592
|
9
|
|
|
|
|
181
|
$self->{iterator} = $self->num_islands - 1; |
593
|
9
|
|
|
|
|
230
|
return $self->at_island( $self->{iterator} ); |
594
|
|
|
|
|
|
|
} else { |
595
|
0
|
|
|
|
|
0
|
$self->{iterator} = undef; |
596
|
0
|
|
|
|
|
0
|
return undef; |
597
|
|
|
|
|
|
|
} |
598
|
|
|
|
|
|
|
} |
599
|
|
|
|
|
|
|
|
600
|
|
|
|
|
|
|
=pod |
601
|
|
|
|
|
|
|
|
602
|
|
|
|
|
|
|
=head2 $island = $set->next_island() |
603
|
|
|
|
|
|
|
|
604
|
|
|
|
|
|
|
Advances the iterator forward by one island, and returns the next |
605
|
|
|
|
|
|
|
island. If the iterator is undefined, the first island is returned. |
606
|
|
|
|
|
|
|
|
607
|
|
|
|
|
|
|
Returns undef if the set is empty or if no more islands are available. |
608
|
|
|
|
|
|
|
|
609
|
|
|
|
|
|
|
=cut |
610
|
|
|
|
|
|
|
|
611
|
|
|
|
|
|
|
sub next_island { |
612
|
29
|
|
|
29
|
1
|
19520
|
my $self = shift; |
613
|
|
|
|
|
|
|
|
614
|
29
|
100
|
|
|
|
91
|
if($self->cardinality) { |
615
|
28
|
100
|
|
|
|
366
|
$self->{iterator} = defined $self->{iterator} ? ++$self->{iterator} : 0; |
616
|
28
|
|
|
|
|
72
|
my $next = $self->at_island( $self->{iterator} ); |
617
|
28
|
100
|
|
|
|
108
|
if($next) { |
618
|
18
|
|
|
|
|
262
|
return $next; |
619
|
|
|
|
|
|
|
} else { |
620
|
10
|
|
|
|
|
21
|
$self->{iterator} = undef; |
621
|
10
|
|
|
|
|
28
|
return undef; |
622
|
|
|
|
|
|
|
} |
623
|
|
|
|
|
|
|
} else { |
624
|
1
|
|
|
|
|
16
|
$self->{iterator} = undef; |
625
|
1
|
|
|
|
|
5
|
return undef; |
626
|
|
|
|
|
|
|
} |
627
|
|
|
|
|
|
|
} |
628
|
|
|
|
|
|
|
|
629
|
|
|
|
|
|
|
=pod |
630
|
|
|
|
|
|
|
|
631
|
|
|
|
|
|
|
=head2 $island = $set->prev_island() |
632
|
|
|
|
|
|
|
|
633
|
|
|
|
|
|
|
Reverses the iterator backward by one island, and returns the previous |
634
|
|
|
|
|
|
|
island. If the iterator is undefined, the last island is returned. |
635
|
|
|
|
|
|
|
|
636
|
|
|
|
|
|
|
Returns undef if the set is empty or if no more islands are available. |
637
|
|
|
|
|
|
|
|
638
|
|
|
|
|
|
|
=cut |
639
|
|
|
|
|
|
|
|
640
|
|
|
|
|
|
|
sub prev_island { |
641
|
29
|
|
|
29
|
1
|
12784
|
my $self = shift; |
642
|
29
|
100
|
|
|
|
80
|
if($self->cardinality) { |
643
|
28
|
100
|
|
|
|
368
|
$self->{iterator} = defined $self->{iterator} ? --$self->{iterator} : $self->num_islands - 1; |
644
|
28
|
100
|
|
|
|
281
|
if($self->{iterator} >= 0) { |
645
|
18
|
|
|
|
|
62
|
return $self->at_island( $self->{iterator} ); |
646
|
|
|
|
|
|
|
} else { |
647
|
10
|
|
|
|
|
36
|
$self->{iterator} = undef; |
648
|
10
|
|
|
|
|
27
|
return undef; |
649
|
|
|
|
|
|
|
} |
650
|
|
|
|
|
|
|
} else { |
651
|
1
|
|
|
|
|
13
|
$self->{iterator} = undef; |
652
|
1
|
|
|
|
|
3
|
return undef; |
653
|
|
|
|
|
|
|
} |
654
|
|
|
|
|
|
|
} |
655
|
|
|
|
|
|
|
|
656
|
|
|
|
|
|
|
=pod |
657
|
|
|
|
|
|
|
|
658
|
|
|
|
|
|
|
=head2 $island = $set->current_island() |
659
|
|
|
|
|
|
|
|
660
|
|
|
|
|
|
|
Returns the island at the current iterator position. |
661
|
|
|
|
|
|
|
|
662
|
|
|
|
|
|
|
Returns undef if the set is empty or if the iterator is not defined. |
663
|
|
|
|
|
|
|
|
664
|
|
|
|
|
|
|
=cut |
665
|
|
|
|
|
|
|
|
666
|
|
|
|
|
|
|
sub current_island { |
667
|
58
|
|
|
58
|
1
|
5899
|
my $self = shift; |
668
|
58
|
|
|
|
|
147
|
return $self->at_island( $self->{iterator} ); |
669
|
|
|
|
|
|
|
} |
670
|
|
|
|
|
|
|
|
671
|
|
|
|
|
|
|
=pod |
672
|
|
|
|
|
|
|
|
673
|
|
|
|
|
|
|
=head2 $cover_data = Set::IntSpan::Island->extract_covers( $set_hash_ref ) |
674
|
|
|
|
|
|
|
|
675
|
|
|
|
|
|
|
Given a C<$set_hash> reference |
676
|
|
|
|
|
|
|
|
677
|
|
|
|
|
|
|
{ id1=>$set1, id2=>$set2, ..., idn=>$setn} |
678
|
|
|
|
|
|
|
|
679
|
|
|
|
|
|
|
where C<$setj> is a finite C object and C |
680
|
|
|
|
|
|
|
is a unique key, C performs an exhaustive intersection |
681
|
|
|
|
|
|
|
of all sets and returns a list of all covers and set memberships. For |
682
|
|
|
|
|
|
|
example, given the id/runlist combination |
683
|
|
|
|
|
|
|
|
684
|
|
|
|
|
|
|
a 10-15 |
685
|
|
|
|
|
|
|
b 12 |
686
|
|
|
|
|
|
|
c 14-20 |
687
|
|
|
|
|
|
|
d 25 |
688
|
|
|
|
|
|
|
|
689
|
|
|
|
|
|
|
The covers are |
690
|
|
|
|
|
|
|
|
691
|
|
|
|
|
|
|
10-11 a |
692
|
|
|
|
|
|
|
12 a b |
693
|
|
|
|
|
|
|
13 a |
694
|
|
|
|
|
|
|
14-15 a c |
695
|
|
|
|
|
|
|
16-20 c |
696
|
|
|
|
|
|
|
21-24 - |
697
|
|
|
|
|
|
|
25 d |
698
|
|
|
|
|
|
|
|
699
|
|
|
|
|
|
|
The cover data is returned as an array reference and its structure is |
700
|
|
|
|
|
|
|
|
701
|
|
|
|
|
|
|
[ [ $cover_set1, [ id11, id12, id13, ... ] ], |
702
|
|
|
|
|
|
|
[ $cover_set2, [ id21, id22, id23, ... ] ], |
703
|
|
|
|
|
|
|
... |
704
|
|
|
|
|
|
|
] |
705
|
|
|
|
|
|
|
|
706
|
|
|
|
|
|
|
If a cover contains no elements, then its entry is |
707
|
|
|
|
|
|
|
|
708
|
|
|
|
|
|
|
[ $cover_set, [ ] ] |
709
|
|
|
|
|
|
|
|
710
|
|
|
|
|
|
|
=cut |
711
|
|
|
|
|
|
|
|
712
|
|
|
|
|
|
|
sub extract_covers { |
713
|
115
|
|
|
115
|
1
|
5901
|
my ($self,$sets) = @_; |
714
|
|
|
|
|
|
|
|
715
|
115
|
50
|
33
|
|
|
943
|
if(! $sets || ref($sets) ne "HASH") { |
716
|
0
|
|
|
|
|
0
|
return []; |
717
|
|
|
|
|
|
|
} |
718
|
|
|
|
|
|
|
|
719
|
|
|
|
|
|
|
# decompose all input sets into spans |
720
|
115
|
|
|
|
|
156
|
my @sets; |
721
|
115
|
|
|
|
|
788
|
for my $id (keys %$sets) { |
722
|
5047
|
50
|
|
|
|
28304
|
confess "value in hash is not a set object" unless $sets->{$id}->can("sets"); |
723
|
5047
|
|
|
|
|
12829
|
for my $span ($sets->{$id}->sets) { |
724
|
53832
|
|
|
|
|
199481
|
push @sets,[$id,$span]; |
725
|
|
|
|
|
|
|
} |
726
|
|
|
|
|
|
|
} |
727
|
|
|
|
|
|
|
# order the spans by increasing min and increasing max |
728
|
115
|
50
|
|
|
|
965670
|
@sets = sort {$a->[1]->min <=> $b->[1]->min || $a->[1]->max <=> $b->[1]->max} @sets; |
|
410908
|
|
|
|
|
12930404
|
|
729
|
|
|
|
|
|
|
# register integers at which cover set membership may change - these are the |
730
|
|
|
|
|
|
|
# integers at set boundaries |
731
|
115
|
|
|
|
|
4440
|
my %edges; |
732
|
115
|
|
|
|
|
418
|
for my $set (@sets) { |
733
|
53832
|
|
|
|
|
77523
|
map {$edges{$_}++} ( map { ($_->[1]->min-1,$_->[1]->min,$_->[1]->max,$_->[1]->max+1) } $set ); |
|
215328
|
|
|
|
|
2381805
|
|
|
53832
|
|
|
|
|
158850
|
|
734
|
|
|
|
|
|
|
} |
735
|
115
|
|
|
|
|
3478
|
my @edges = sort {$a <=> $b} keys %edges; |
|
42404
|
|
|
|
|
42618
|
|
736
|
|
|
|
|
|
|
# first and last edge are not part of any set (min(leftmost)-1, max(rightmost)+1) - remove them |
737
|
115
|
|
|
|
|
818
|
splice(@edges,0,1); |
738
|
115
|
|
|
|
|
306
|
splice(@edges,-1,1); |
739
|
115
|
|
|
|
|
214
|
my $i = 0; |
740
|
115
|
|
|
|
|
226
|
my $j_low = 0; |
741
|
115
|
|
|
|
|
145
|
my $covers; |
742
|
|
|
|
|
|
|
#print "edges ",join(" ",@edges),"\n"; |
743
|
115
|
|
|
|
|
468
|
while($i < @edges) { |
744
|
5356
|
|
|
|
|
8610
|
my $edge = $edges[$i]; |
745
|
5356
|
|
|
|
|
8388
|
my $edge_next = $edges[$i+1]; |
746
|
5356
|
|
|
|
|
5411
|
my $cover; |
747
|
5356
|
100
|
100
|
|
|
23789
|
if(! defined $edge_next || $edge + 1 == $edge_next) { |
748
|
2671
|
|
|
|
|
6688
|
$cover = $self->new($edge); |
749
|
2671
|
|
|
|
|
3927
|
$i++; |
750
|
|
|
|
|
|
|
} else { |
751
|
2685
|
|
|
|
|
7789
|
$cover = $self->new($edge,$edge_next); |
752
|
2685
|
|
|
|
|
4025
|
$i += 2; |
753
|
|
|
|
|
|
|
} |
754
|
|
|
|
|
|
|
#printf("cover %3d %3d j_low %d\n",$cover->min,$cover->max,$j_low); |
755
|
5356
|
|
|
|
|
6344
|
my $found; |
756
|
5356
|
|
|
|
|
7749
|
my $j_low_incr = 0; |
757
|
5356
|
|
|
|
|
13259
|
push @$covers, [ $cover , []]; |
758
|
5356
|
|
|
|
|
15305
|
for my $j ($j_low..@sets-1) { |
759
|
240544
|
|
|
|
|
1771917
|
my ($id,$set) = @{$sets[$j]}; |
|
240544
|
|
|
|
|
547653
|
|
760
|
240544
|
|
|
|
|
542158
|
my $ol = $set->overlap($cover); |
761
|
240544
|
100
|
|
|
|
12011893
|
if($ol) { |
762
|
99046
|
|
|
|
|
127734
|
$found = 1; |
763
|
|
|
|
|
|
|
#print " ",$sets[$j][0]," ",$set->run_list,"\n" if $ol; |
764
|
99046
|
|
|
|
|
97755
|
push @{$covers->[-1][1]}, $id; |
|
99046
|
|
|
|
|
309115
|
|
765
|
|
|
|
|
|
|
} else { |
766
|
141498
|
100
|
|
|
|
227906
|
if($found) { |
767
|
78063
|
100
|
|
|
|
176434
|
last if $set->min > $cover->max; |
768
|
|
|
|
|
|
|
} else { |
769
|
63435
|
|
|
|
|
111326
|
$j_low_incr++; |
770
|
|
|
|
|
|
|
} |
771
|
|
|
|
|
|
|
} |
772
|
|
|
|
|
|
|
} |
773
|
5356
|
100
|
100
|
|
|
124445
|
if(@$covers > 1 && |
|
5241
|
|
|
|
|
21668
|
|
774
|
5241
|
|
|
|
|
40085
|
join("",@{$covers->[-1][1]}) eq join("",@{$covers->[-2][1]})) { |
775
|
773
|
|
|
|
|
4003
|
$covers->[-2][0] = $covers->[-2][0]->union ($covers->[-1][0]); |
776
|
773
|
|
|
|
|
28313
|
splice(@$covers,-1,1); |
777
|
|
|
|
|
|
|
} |
778
|
5356
|
100
|
|
|
|
24423
|
$j_low += $j_low_incr if $found; |
779
|
|
|
|
|
|
|
} |
780
|
115
|
|
|
|
|
117521
|
return $covers; |
781
|
|
|
|
|
|
|
} |
782
|
|
|
|
|
|
|
|
783
|
|
|
|
|
|
|
1; |
784
|
|
|
|
|
|
|
|
785
|
|
|
|
|
|
|
__END__ |