line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
package Array::OverlapFinder; |
2
|
|
|
|
|
|
|
|
3
|
|
|
|
|
|
|
our $AUTHORITY = 'cpan:PERLANCAR'; # AUTHORITY |
4
|
|
|
|
|
|
|
our $DATE = '2021-01-02'; # DATE |
5
|
|
|
|
|
|
|
our $DIST = 'Array-OverlapFinder'; # DIST |
6
|
|
|
|
|
|
|
our $VERSION = '0.005'; # VERSION |
7
|
|
|
|
|
|
|
|
8
|
1
|
|
|
1
|
|
55894
|
use 5.010001; |
|
1
|
|
|
|
|
11
|
|
9
|
1
|
|
|
1
|
|
6
|
use strict; |
|
1
|
|
|
|
|
1
|
|
|
1
|
|
|
|
|
20
|
|
10
|
1
|
|
|
1
|
|
4
|
use warnings; |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
33
|
|
11
|
|
|
|
|
|
|
|
12
|
1
|
|
|
1
|
|
6
|
use Exporter qw(import); |
|
1
|
|
|
|
|
1
|
|
|
1
|
|
|
|
|
368
|
|
13
|
|
|
|
|
|
|
our @EXPORT_OK = qw(find_overlap combine_overlap); |
14
|
|
|
|
|
|
|
|
15
|
|
|
|
|
|
|
sub _find_or_combine_overlap { |
16
|
28
|
|
|
28
|
|
45
|
my $action = shift; |
17
|
28
|
100
|
|
|
|
62
|
my $opts = ref($_[0]) eq 'HASH' ? shift : {}; |
18
|
28
|
|
|
|
|
49
|
my $detail = $opts->{detail}; |
19
|
28
|
50
|
|
|
|
56
|
@_ >= 2 or die "Please supply at least two sequences"; |
20
|
|
|
|
|
|
|
|
21
|
28
|
|
|
|
|
35
|
my @detail_res; |
22
|
|
|
|
|
|
|
my @all_overlap_items; |
23
|
|
|
|
|
|
|
|
24
|
28
|
|
|
|
|
32
|
my $seq1 = shift; |
25
|
28
|
|
|
|
|
31
|
my $num_seqs = 1; |
26
|
|
|
|
|
|
|
SEQ: |
27
|
28
|
|
|
|
|
50
|
while (@_) { |
28
|
32
|
|
|
|
|
35
|
my $seq2 = shift; |
29
|
32
|
|
|
|
|
34
|
$num_seqs++; |
30
|
|
|
|
|
|
|
|
31
|
32
|
|
|
|
|
38
|
my @overlap_items; |
32
|
|
|
|
|
|
|
my $index_at_seq1; |
33
|
|
|
|
|
|
|
|
34
|
|
|
|
|
|
|
L1: |
35
|
32
|
|
|
|
|
35
|
for my $i (0 .. $#{$seq1}) { |
|
32
|
|
|
|
|
66
|
|
36
|
92
|
|
|
|
|
100
|
my $j = $i; |
37
|
92
|
|
100
|
|
|
97
|
while ($j <= $#{$seq1} && ($j-$i) <= $#{$seq2}) { |
|
160
|
|
|
|
|
248
|
|
|
140
|
|
|
|
|
262
|
|
38
|
136
|
100
|
|
|
|
260
|
if ($seq1->[$j] ne $seq2->[$j - $i]) { |
39
|
68
|
|
|
|
|
106
|
next L1; |
40
|
|
|
|
|
|
|
} |
41
|
68
|
|
|
|
|
72
|
$j++; |
42
|
|
|
|
|
|
|
} |
43
|
24
|
|
|
|
|
30
|
@overlap_items = @{$seq1}[$i .. $#{$seq1}]; |
|
24
|
|
|
|
|
50
|
|
|
24
|
|
|
|
|
39
|
|
44
|
24
|
|
|
|
|
41
|
$index_at_seq1 = $i; |
45
|
24
|
|
|
|
|
37
|
last L1; |
46
|
|
|
|
|
|
|
} |
47
|
|
|
|
|
|
|
|
48
|
32
|
|
|
|
|
42
|
my @combined; |
49
|
32
|
100
|
|
|
|
76
|
if (defined $index_at_seq1) { |
50
|
24
|
|
|
|
|
33
|
@combined = (@$seq1, @{$seq2}[ ($#{$seq1} - $index_at_seq1 + 1) .. $#{$seq2} ]); |
|
24
|
|
|
|
|
45
|
|
|
24
|
|
|
|
|
34
|
|
|
24
|
|
|
|
|
28
|
|
51
|
|
|
|
|
|
|
} else { |
52
|
8
|
|
|
|
|
19
|
@combined = (@$seq1, @$seq2); |
53
|
|
|
|
|
|
|
} |
54
|
32
|
|
|
|
|
49
|
$seq1 = \@combined; |
55
|
|
|
|
|
|
|
|
56
|
32
|
|
|
|
|
47
|
push @detail_res, \@overlap_items, $index_at_seq1; |
57
|
32
|
|
|
|
|
69
|
push @all_overlap_items, \@overlap_items; |
58
|
|
|
|
|
|
|
} # SEQ |
59
|
|
|
|
|
|
|
|
60
|
28
|
100
|
|
|
|
47
|
if ($action eq 'find') { |
61
|
14
|
100
|
|
|
|
20
|
if ($detail) { |
62
|
7
|
|
|
|
|
39
|
return @detail_res; |
63
|
|
|
|
|
|
|
} else { |
64
|
7
|
100
|
|
|
|
10
|
if ($num_seqs > 2) { |
65
|
1
|
|
|
|
|
7
|
return @all_overlap_items; |
66
|
|
|
|
|
|
|
} else { |
67
|
6
|
|
|
|
|
6
|
return @{ $all_overlap_items[0] }; |
|
6
|
|
|
|
|
39
|
|
68
|
|
|
|
|
|
|
} |
69
|
|
|
|
|
|
|
} |
70
|
|
|
|
|
|
|
} else { |
71
|
|
|
|
|
|
|
# combine |
72
|
14
|
100
|
|
|
|
21
|
if ($detail) { |
73
|
7
|
|
|
|
|
42
|
return ($seq1, @detail_res); |
74
|
|
|
|
|
|
|
} else { |
75
|
7
|
|
|
|
|
48
|
return @$seq1; |
76
|
|
|
|
|
|
|
} |
77
|
|
|
|
|
|
|
} |
78
|
|
|
|
|
|
|
} |
79
|
|
|
|
|
|
|
|
80
|
14
|
|
|
14
|
1
|
1028
|
sub find_overlap { _find_or_combine_overlap('find', @_) } |
81
|
|
|
|
|
|
|
|
82
|
14
|
|
|
14
|
1
|
2635
|
sub combine_overlap { _find_or_combine_overlap('combine', @_) } |
83
|
|
|
|
|
|
|
|
84
|
|
|
|
|
|
|
1; |
85
|
|
|
|
|
|
|
# ABSTRACT: Find/remove overlapping items among ordered sequences |
86
|
|
|
|
|
|
|
|
87
|
|
|
|
|
|
|
__END__ |