| line | stmt | bran | cond | sub | pod | time | code | 
| 1 |  |  |  |  |  |  | package Array::OverlapFinder; | 
| 2 |  |  |  |  |  |  |  | 
| 3 |  |  |  |  |  |  | our $AUTHORITY = 'cpan:PERLANCAR'; # AUTHORITY | 
| 4 |  |  |  |  |  |  | our $DATE = '2021-01-02'; # DATE | 
| 5 |  |  |  |  |  |  | our $DIST = 'Array-OverlapFinder'; # DIST | 
| 6 |  |  |  |  |  |  | our $VERSION = '0.004'; # VERSION | 
| 7 |  |  |  |  |  |  |  | 
| 8 | 1 |  |  | 1 |  | 68236 | use 5.010001; | 
|  | 1 |  |  |  |  | 13 |  | 
| 9 | 1 |  |  | 1 |  | 29 | use strict; | 
|  | 1 |  |  |  |  | 2 |  | 
|  | 1 |  |  |  |  | 82 |  | 
| 10 | 1 |  |  | 1 |  | 9 | use warnings; | 
|  | 1 |  |  |  |  | 2 |  | 
|  | 1 |  |  |  |  | 46 |  | 
| 11 |  |  |  |  |  |  |  | 
| 12 | 1 |  |  | 1 |  | 7 | use Exporter qw(import); | 
|  | 1 |  |  |  |  | 1 |  | 
|  | 1 |  |  |  |  | 452 |  | 
| 13 |  |  |  |  |  |  | our @EXPORT_OK = qw(find_overlap combine_overlap); | 
| 14 |  |  |  |  |  |  |  | 
| 15 |  |  |  |  |  |  | sub _find_or_combine_overlap { | 
| 16 | 28 |  |  | 28 |  | 51 | my $action = shift; | 
| 17 | 28 | 100 |  |  |  | 83 | my $opts = ref($_[0]) eq 'HASH' ? shift : {}; | 
| 18 | 28 |  |  |  |  | 44 | my $detail = $opts->{detail}; | 
| 19 | 28 | 50 |  |  |  | 73 | @_ >= 2 or die "Please supply at least two sequences"; | 
| 20 |  |  |  |  |  |  |  | 
| 21 | 28 |  |  |  |  | 40 | my @detail_res; | 
| 22 |  |  |  |  |  |  | my @all_overlap_items; | 
| 23 |  |  |  |  |  |  |  | 
| 24 | 28 |  |  |  |  | 43 | my $seq1 = shift; | 
| 25 | 28 |  |  |  |  | 37 | my $num_seqs = 1; | 
| 26 |  |  |  |  |  |  | SEQ: | 
| 27 | 28 |  |  |  |  | 58 | while (@_) { | 
| 28 | 32 |  |  |  |  | 41 | my $seq2 = shift; | 
| 29 | 32 |  |  |  |  | 44 | $num_seqs++; | 
| 30 |  |  |  |  |  |  |  | 
| 31 | 32 |  |  |  |  | 45 | my @overlap_items; | 
| 32 |  |  |  |  |  |  | my $index_at_seq1; | 
| 33 |  |  |  |  |  |  |  | 
| 34 |  |  |  |  |  |  | L1: | 
| 35 | 32 |  |  |  |  | 44 | for my $i (0 .. $#{$seq1}) { | 
|  | 32 |  |  |  |  | 81 |  | 
| 36 | 92 |  |  |  |  | 122 | my $j = $i; | 
| 37 | 92 |  | 100 |  |  | 110 | while ($j <= $#{$seq1} && ($j-$i) <= $#{$seq2}) { | 
|  | 160 |  |  |  |  | 317 |  | 
|  | 140 |  |  |  |  | 313 |  | 
| 38 | 136 | 100 |  |  |  | 313 | if ($seq1->[$j] ne $seq2->[$j - $i]) { | 
| 39 | 68 |  |  |  |  | 135 | next L1; | 
| 40 |  |  |  |  |  |  | } | 
| 41 | 68 |  |  |  |  | 91 | $j++; | 
| 42 |  |  |  |  |  |  | } | 
| 43 | 24 |  |  |  |  | 40 | @overlap_items = @{$seq1}[$i .. $#{$seq1}]; | 
|  | 24 |  |  |  |  | 64 |  | 
|  | 24 |  |  |  |  | 37 |  | 
| 44 | 24 |  |  |  |  | 38 | $index_at_seq1 = $i; | 
| 45 | 24 |  |  |  |  | 41 | last L1; | 
| 46 |  |  |  |  |  |  | } | 
| 47 |  |  |  |  |  |  |  | 
| 48 | 32 |  |  |  |  | 44 | my @combined; | 
| 49 | 32 | 100 |  |  |  | 63 | if (defined $index_at_seq1) { | 
| 50 | 24 |  |  |  |  | 50 | @combined = (@$seq1, @{$seq2}[ ($#{$seq1} - $index_at_seq1 + 1) .. $#{$seq2} ]); | 
|  | 24 |  |  |  |  | 55 |  | 
|  | 24 |  |  |  |  | 46 |  | 
|  | 24 |  |  |  |  | 32 |  | 
| 51 |  |  |  |  |  |  | } else { | 
| 52 | 8 |  |  |  |  | 26 | @combined = (@$seq1, @$seq2); | 
| 53 |  |  |  |  |  |  | } | 
| 54 | 32 |  |  |  |  | 62 | $seq1 = \@combined; | 
| 55 |  |  |  |  |  |  |  | 
| 56 | 32 |  |  |  |  | 55 | push @detail_res, \@overlap_items, $index_at_seq1; | 
| 57 | 32 |  |  |  |  | 86 | push @all_overlap_items, \@overlap_items; | 
| 58 |  |  |  |  |  |  | } # SEQ | 
| 59 |  |  |  |  |  |  |  | 
| 60 | 28 | 100 |  |  |  | 52 | if ($action eq 'find') { | 
| 61 | 14 | 100 |  |  |  | 25 | if ($detail) { | 
| 62 | 7 |  |  |  |  | 43 | return @detail_res; | 
| 63 |  |  |  |  |  |  | } else { | 
| 64 | 7 | 100 |  |  |  | 14 | if ($num_seqs > 2) { | 
| 65 | 1 |  |  |  |  | 8 | return @all_overlap_items; | 
| 66 |  |  |  |  |  |  | } else { | 
| 67 | 6 |  |  |  |  | 7 | return @{ $all_overlap_items[0] }; | 
|  | 6 |  |  |  |  | 46 |  | 
| 68 |  |  |  |  |  |  | } | 
| 69 |  |  |  |  |  |  | } | 
| 70 |  |  |  |  |  |  | } else { | 
| 71 |  |  |  |  |  |  | # combine | 
| 72 | 14 | 100 |  |  |  | 25 | if ($detail) { | 
| 73 | 7 |  |  |  |  | 80 | return ($seq1, @detail_res); | 
| 74 |  |  |  |  |  |  | } else { | 
| 75 | 7 |  |  |  |  | 59 | return @$seq1; | 
| 76 |  |  |  |  |  |  | } | 
| 77 |  |  |  |  |  |  | } | 
| 78 |  |  |  |  |  |  | } | 
| 79 |  |  |  |  |  |  |  | 
| 80 | 14 |  |  | 14 | 1 | 1112 | sub find_overlap    { _find_or_combine_overlap('find', @_) } | 
| 81 |  |  |  |  |  |  |  | 
| 82 | 14 |  |  | 14 | 1 | 3022 | sub combine_overlap { _find_or_combine_overlap('combine', @_) } | 
| 83 |  |  |  |  |  |  |  | 
| 84 |  |  |  |  |  |  | 1; | 
| 85 |  |  |  |  |  |  | # ABSTRACT: Find/remove overlapping items among ordered sequences | 
| 86 |  |  |  |  |  |  |  | 
| 87 |  |  |  |  |  |  | __END__ |